{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 20春_Web数据挖掘\n",
    "# 项目2 by 廖汉腾, 许智超\n",
    "* HTTP状态狗 取/存图片及img alt文字\n",
    "* 豆瓣电影排行榜\n",
    "* 再试试运气 \n",
    "   * pandas [pandas.read_html()](https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.read_html.html)取出数据说用了lxml\n",
    "   *  \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "URL_src = { \"HTTP状态狗\" : \"https://httpstatusdogs.com/\",\n",
    "           \"豆瓣电影排行榜\" : \"https://movie.douban.com/chart\"  }"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 项目2A. HTTP状态狗\n",
    "### pd.read_html 试运气"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "ename": "HTTPError",
     "evalue": "HTTP Error 403: Forbidden",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mHTTPError\u001b[0m                                 Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-4-4fc2a0c5adf2>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mpandas\u001b[0m \u001b[1;32mas\u001b[0m \u001b[0mpd\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 2\u001b[1;33m \u001b[0mdf\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mread_html\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mURL_src\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'HTTP状态狗'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mencoding\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;34m\"utf8\"\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mheader\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mindex_col\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[1;32mC:\\ProgramData\\Anaconda3\\lib\\site-packages\\pandas\\io\\html.py\u001b[0m in \u001b[0;36mread_html\u001b[1;34m(io, match, flavor, header, index_col, skiprows, attrs, parse_dates, thousands, encoding, decimal, converters, na_values, keep_default_na, displayed_only)\u001b[0m\n\u001b[0;32m   1103\u001b[0m         \u001b[0mna_values\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mna_values\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   1104\u001b[0m         \u001b[0mkeep_default_na\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mkeep_default_na\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 1105\u001b[1;33m         \u001b[0mdisplayed_only\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mdisplayed_only\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m   1106\u001b[0m     )\n",
      "\u001b[1;32mC:\\ProgramData\\Anaconda3\\lib\\site-packages\\pandas\\io\\html.py\u001b[0m in \u001b[0;36m_parse\u001b[1;34m(flavor, io, match, attrs, encoding, displayed_only, **kwargs)\u001b[0m\n\u001b[0;32m    910\u001b[0m             \u001b[1;32mbreak\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    911\u001b[0m     \u001b[1;32melse\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 912\u001b[1;33m         \u001b[0mraise_with_traceback\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mretained\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    913\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    914\u001b[0m     \u001b[0mret\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;33m[\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32mC:\\ProgramData\\Anaconda3\\lib\\site-packages\\pandas\\compat\\__init__.py\u001b[0m in \u001b[0;36mraise_with_traceback\u001b[1;34m(exc, traceback)\u001b[0m\n\u001b[0;32m     44\u001b[0m     \u001b[1;32mif\u001b[0m \u001b[0mtraceback\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mEllipsis\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     45\u001b[0m         \u001b[0m_\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0m_\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mtraceback\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0msys\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mexc_info\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 46\u001b[1;33m     \u001b[1;32mraise\u001b[0m \u001b[0mexc\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mwith_traceback\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mtraceback\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     47\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     48\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;31mHTTPError\u001b[0m: HTTP Error 403: Forbidden"
     ]
    }
   ],
   "source": [
    "import pandas as pd\n",
    "df = pd.read_html(URL_src['HTTP状态狗'], encoding=\"utf8\", header=0, index_col=0)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 😱 HTTP Error 403: Forbidden\n",
    "####  上面出现了反爬？？因为它认为我们不是浏览器？？无法查询\n",
    "\n",
    "### 改试 requests + lxml  （假装我们是浏览器）"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "200 b'<!doctype html>\\n<html lang=\"en\">\\n<head>\\n<meta charset=\"utf-8\" />\\n<meta http-equiv=\"X-UA-Compatible\" content=\"IE=edge,chrome=1\" />\\n<title>HTTP Status Dogs</title>\\n<meta name=\"rating\" content=\"general\" />\\n<meta name=\"subject\" content=\"Hypertext Transfer Protocol Response status codes. And dogs.\" />\\n<meta name=\"author\" content=\"Mike Lee\" />\\n<meta name=\"publisher\" content=\"HTTP Status Dogs\" />\\n<meta name=\"copyright\" content=\"Mike Lee\" />\\n<meta name=\"host\" content=\"httpstatusdogs.com\" />\\n<meta name=\"description\" content=\"HTTP Status Dogs. Hypertext Transfer Protocol Response status codes. And dogs.\" />\\n<meta name=\"viewport\" content=\"width=device-width, initial-scale=1\">\\n<meta property=\"og:type\" content=\"website\" />\\n<meta property=\"og:title\" content=\"HTTP Status Dogs\" />\\n<meta property=\"og:description\" content=\"HTTP Status Dogs. Hypertext Transfer Protocol Response status codes. And dogs.\" />\\n<meta property=\"og:image\" content=\"https://httpstatusdogs.com/img/200.jpg\" />\\n<meta property=\"og:site_name\" content=\"HTTP Status Dogs\" />\\n<meta property=\"og:url\" content=\"https://httpstatusdogs.com/\" />\\n<meta name=\"twitter:card\" content=\"summary_large_image\" />\\n<meta name=\"twitter:title\" content=\"HTTP Status Dogs\" />\\n<meta name=\"twitter:description\" content=\"HTTP Status Dogs. Hypertext Transfer Protocol Response status codes. 
And dogs.\" />\\n<meta name=\"twitter:image\" content=\"https://httpstatusdogs.com/img/200.jpg\" />\\n<meta name=\"twitter:site\" content=\"@mikeeleorg\" />\\n<meta name=\"twitter:creator\" content=\"@mikeeleorg\" />\\n<link rel=\"canonical\" href=\"https://httpstatusdogs.com/\" />\\n<link rel=\"apple-touch-icon\" href=\"apple-touch-icon.png\">\\n<link rel=\"icon\" href=\"https://httpstatusdogs.com/img/paw-32x32.png\" sizes=\"32x32\" type=\"image/png\">\\n<link rel=\"icon\" href=\"https://httpstatusdogs.com/img/paw-48x48.png\" sizes=\"48x48\" type=\"image/png\">\\n<link rel=\"icon\" href=\"https://httpstatusdogs.com/img/paw-62x62.png\" sizes=\"62x62\" type=\"image/png\">\\n<link rel=\"icon\" href=\"https://httpstatusdogs.com/img/paw-192x192.png\" sizes=\"192x192\" type=\"image/png\">\\n<link rel=\"stylesheet\" href=\"https://maxcdn.bootstrapcdn.com/bootstrap/4.0.0-beta/css/bootstrap.min.css\" integrity=\"sha384-/Y6pD6FV/Vv2HJnA6t+vslU6fwYXjCFtcEpHbNJ0lyAFsXTsjBbfaDjzALeQsN6M\" crossorigin=\"anonymous\">\\n<link rel=\"stylesheet\" href=\"/css/styles.css\">\\n<script>\\n\\n  (function(i,s,o,g,r,a,m){i[\\'GoogleAnalyticsObject\\']=r;i[r]=i[r]||function(){\\n  (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),\\n  m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)\\n  })(window,document,\\'script\\',\\'https://www.google-analytics.com/analytics.js\\',\\'ga\\');\\n  ga(\\'create\\', \\'UA-316713-16\\', \\'auto\\');\\n  ga(\\'send\\', \\'pageview\\');\\n\\n  </script>\\n</head>\\n<body itemscope itemtype=\"http://schema.org/APIReference\">\\n<header class=\"container-fluid\">\\n<div class=\"row\">\\n<div class=\"col-md-8\">\\n<h1 class=\"site-name\" itemprop=\"author\"><a href=\"https://httpstatusdogs.com/\" itemprop=\"url\">HTTP Status Dogs</a></h1>\\n<h2 class=\"tagline\" itemprop=\"about\">Hypertext Transfer Protocol Response status codes. 
And dogs.</h2>\\n</div>\\n<div class=\"col-md-4 inspiration\">\\n<div>Inspired by the <a href=\"https://www.flickr.com/photos/girliemac/sets/72157628409467125\">HTTP Status Cats</a> from <a href=\"https://twitter.com/girlie_mac\">@girlie_mac</a> :)</div>\\n</div>\\n</div>\\n</header>\\n<hr>\\n<main class=\"container-fluid\">\\n<div class=\"row\">\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"100-continue\" class=\"thumbnail\"><img src=\"img/100.jpg\" alt=\"100 Continue\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"200-ok\" class=\"thumbnail\"><img src=\"img/200.jpg\" alt=\"200 OK\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"201-created\" class=\"thumbnail\"><img src=\"img/201.jpg\" alt=\"201 Created\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"202-accepted\" class=\"thumbnail\"><img src=\"img/202.jpg\" alt=\"202 Accepted\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"203-non-authoritative-information\" class=\"thumbnail\"><img src=\"img/203.jpg\" alt=\"203 Non-Authoritative Information\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"204-no-content\" class=\"thumbnail\"><img src=\"img/204.jpg\" alt=\"204 No Content\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"206-partial-content\" class=\"thumbnail\"><img src=\"img/206.jpg\" alt=\"206 Partial Content\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"207-multi-status\" class=\"thumbnail\"><img src=\"img/207.jpg\" alt=\"207 Multi-Status\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"208-already-reported\" class=\"thumbnail\"><img src=\"img/208.jpg\" alt=\"208 Already Reported\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"226-im-used\" class=\"thumbnail\"><img 
src=\"img/226.jpg\" alt=\"226 IM Used\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"300-multiple-choices\" class=\"thumbnail\"><img src=\"img/300.jpg\" alt=\"300 Multiple Choices\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"301-moved-permanently\" class=\"thumbnail\"><img src=\"img/301.jpg\" alt=\"301 Moved Permanently\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"302-found\" class=\"thumbnail\"><img src=\"img/302.jpg\" alt=\"302 Found\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"303-see-other\" class=\"thumbnail\"><img src=\"img/303.jpg\" alt=\"303 See Other\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"304-not-modified\" class=\"thumbnail\"><img src=\"img/304.jpg\" alt=\"304 Not Modified\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"305-use-proxy\" class=\"thumbnail\"><img src=\"img/305.jpg\" alt=\"305 Use Proxy\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"306-switch-proxy\" class=\"thumbnail\"><img src=\"img/306.jpg\" alt=\"306 Switch Proxy\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"307-temporary-redirect\" class=\"thumbnail\"><img src=\"img/307.jpg\" alt=\"307 Temporary Redirect\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"308-permanent-redirect\" class=\"thumbnail\"><img src=\"img/308.jpg\" alt=\"308 Permanent Redirect\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"400-bad-request\" class=\"thumbnail\"><img src=\"img/400.jpg\" alt=\"400 Bad Request\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"401-unauthorized\" class=\"thumbnail\"><img src=\"img/401.jpg\" alt=\"401 Unauthorized\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a 
href=\"402-payment-required\" class=\"thumbnail\"><img src=\"img/402.jpg\" alt=\"402 Payment Required\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"403-forbidden\" class=\"thumbnail\"><img src=\"img/403.jpg\" alt=\"403 Forbidden\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"404-not-found\" class=\"thumbnail\"><img src=\"img/404.jpg\" alt=\"404 Not Found\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"405-method-not-allowed\" class=\"thumbnail\"><img src=\"img/405.jpg\" alt=\"405 Method Not Allowed\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"406-not-acceptable\" class=\"thumbnail\"><img src=\"img/406.jpg\" alt=\"406 Not Acceptable\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"407-proxy-authentication-required\" class=\"thumbnail\"><img src=\"img/407.jpg\" alt=\"407 Proxy Authentication Required\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"408-request-timeout\" class=\"thumbnail\"><img src=\"img/408.jpg\" alt=\"408 Request Timeout\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"409-conflict\" class=\"thumbnail\"><img src=\"img/409.jpg\" alt=\"409 Conflict\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"410-gone\" class=\"thumbnail\"><img src=\"img/410.jpg\" alt=\"410 Gone\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"411-length-required\" class=\"thumbnail\"><img src=\"img/411.jpg\" alt=\"411 Length Required\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"412-precondition-failed\" class=\"thumbnail\"><img src=\"img/412.jpg\" alt=\"412 Precondition Failed\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"413-request-entity-too-large\" class=\"thumbnail\"><img 
src=\"img/413.jpg\" alt=\"413 Request Entity Too Large\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"414-request-uri-too-long\" class=\"thumbnail\"><img src=\"img/414.jpg\" alt=\"414 Request-URI Too Long\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"416-requested-range-not-satisfiable\" class=\"thumbnail\"><img src=\"img/416.jpg\" alt=\"416 Requested Range Not Satisfiable\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"417-expectation-failed\" class=\"thumbnail\"><img src=\"img/417.jpg\" alt=\"417 Expectation Failed\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"418-im-a-teapot\" class=\"thumbnail\"><img src=\"img/418.jpg\" alt=\"418 I\\'m a teapot\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"420-enhance-your-calm\" class=\"thumbnail\"><img src=\"img/420.jpg\" alt=\"420 Enhance Your Calm\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"422-unprocessable-entity\" class=\"thumbnail\"><img src=\"img/422.jpg\" alt=\"422 Unprocessable Entity\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"423-locked\" class=\"thumbnail\"><img src=\"img/423.jpg\" alt=\"423 Locked\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"424-failed-dependency\" class=\"thumbnail\"><img src=\"img/424.jpg\" alt=\"424 Failed Dependency\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"425-unordered-collection\" class=\"thumbnail\"><img src=\"img/425.jpg\" alt=\"425 Unordered Collection\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"426-upgrade-required\" class=\"thumbnail\"><img src=\"img/426.jpg\" alt=\"426 Upgrade Required\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"429-too-many-requests\" 
class=\"thumbnail\"><img src=\"img/429.jpg\" alt=\"429 Too Many Requests\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"431-request-header-fields-too-large\" class=\"thumbnail\"><img src=\"img/431.jpg\" alt=\"431 Request Header Fields Too Large\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"444-no-response\" class=\"thumbnail\"><img src=\"img/444.jpg\" alt=\"444 No Response\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"450-blocked-by-windows-parental-controls\" class=\"thumbnail\"><img src=\"img/450.jpg\" alt=\"450 Blocked by Windows Parental Controls\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"451-unavailable-for-legal-reasons\" class=\"thumbnail\"><img src=\"img/451.jpg\" alt=\"451 Unavailable For Legal Reasons\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"494-request-header-too-large\" class=\"thumbnail\"><img src=\"img/494.jpg\" alt=\"494 Request Header Too Large\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"500-internal-server-error\" class=\"thumbnail\"><img src=\"img/500.jpg\" alt=\"500 Internal Server Error\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"501-not-implemented\" class=\"thumbnail\"><img src=\"img/501.jpg\" alt=\"501 Not Implemented\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"502-bad-gateway\" class=\"thumbnail\"><img src=\"img/502.jpg\" alt=\"502 Bad Gateway\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"503-service-unavailable\" class=\"thumbnail\"><img src=\"img/503.jpg\" alt=\"503 Service Unavailable\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"504-gateway-timeout\" class=\"thumbnail\"><img src=\"img/504.jpg\" alt=\"504 Gateway Timeout\"></a>\\n</div>\\n<div class=\"col-lg-3 
col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"506-variant-also-negotiates\" class=\"thumbnail\"><img src=\"img/506.jpg\" alt=\"506 Variant Also Negotiates\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"507-insufficient-storage\" class=\"thumbnail\"><img src=\"img/507.jpg\" alt=\"507 Insufficient Storage\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"508-loop-detected\" class=\"thumbnail\"><img src=\"img/508.jpg\" alt=\"508 Loop Detected\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"509-bandwidth-limit-exceeded\" class=\"thumbnail\"><img src=\"img/509.jpg\" alt=\"509 Bandwidth Limit Exceeded\"></a>\\n</div>\\n<div class=\"col-lg-3 col-md-4 col-sm-6 col-xs-12\">\\n<a href=\"510-not-extended\" class=\"thumbnail\"><img src=\"img/510.jpg\" alt=\"510 Not Extended\"></a>\\n</div>\\n</div>\\n</main>\\n<div class=\"paw\"></div>\\n<hr>\\n<footer class=\"container-fluid\">\\n<div class=\"row\">\\n<div class=\"col-md-6\">\\n<p>\\n&copy; Copyright 2020.\\nFrom <a href=\"https://twitter.com/mikeleeorg\">@mikeleeorg</a>.<br>\\nFor more fun:\\n<a href=\"https://csshumor.com/\">CSS Humor</a> &middot;\\n<a href=\"https://doggoipsum.com/\">Doggo Ipsum</a> &middot;\\n<a href=\"https://web20ipsum.com/\">Web 2.0 Ipsum</a> &middot;\\n<a href=\"https://javascriptbabybooks.com/\">JavaScript Baby Books</a>.\\n</p>\\n</div>\\n<div class=\"col-md-6\">\\n<p class=\"social-share\">Ha ha funny, right? 
Share with your friends!</p>\\n<a href=\"https://twitter.com/share\" class=\"twitter-share-button\" data-via=\"mikeleeorg\">Tweet</a>\\n<div class=\"fb-share-button\" data-layout=\"button_count\" data-mobile-iframe=\"true\"></div>\\n<div class=\"g-plusone\" data-size=\"medium\"></div>\\n<a href=\"//www.reddit.com/submit\" class=\"reddit\" onclick=\"window.location=\\'//www.reddit.com/submit?url=\\' + encodeURIComponent(window.location); return false\"><img src=\"//www.redditstatic.com/spreddit7.gif\" alt=\"submit to reddit\" border=\"0\" /></a>\\n</div>\\n</div>\\n</footer>\\n<div id=\"fb-root\"></div>\\n<script src=\"https://code.jquery.com/jquery-3.2.1.slim.min.js\" integrity=\"sha256-k2WSCIexGzOj3Euiig+TlR8gA0EmPjuc79OEeY5L45g=\" crossorigin=\"anonymous\"></script>\\n<script>\\n\\njQuery(document).ready(function($) {\\n  $(document).keydown(function(e) {\\n    if (e.which == 39) { location.href = $(\".next a\").attr(\"href\"); e.preventDefault(); }\\n    if (e.which == 37) { location.href = $(\".previous a\").attr(\"href\"); e.preventDefault(); }\\n  })\\n});\\n\\n!function(d,s,id){var js,fjs=d.getElementsByTagName(s)[0],p=/^http:/.test(d.location)?\\'http\\':\\'https\\';if(!d.getElementById(id)){js=d.createElement(s);js.id=id;js.src=p+\\'://platform.twitter.com/widgets.js\\';fjs.parentNode.insertBefore(js,fjs);}}(document, \\'script\\', \\'twitter-wjs\\');\\n\\n(function(d, s, id) {\\n  var js, fjs = d.getElementsByTagName(s)[0];\\n  if (d.getElementById(id)) return;\\n  js = d.createElement(s); js.id = id;\\n  js.src = \"//connect.facebook.net/en_US/sdk.js#xfbml=1&version=v2.6&appId=261169337249871\";\\n  fjs.parentNode.insertBefore(js, fjs);\\n}(document, \\'script\\', \\'facebook-jssdk\\'));\\n\\n</script>\\n<script src=\"https://apis.google.com/js/platform.js\" async defer></script>\\n</body>\\n</html>\\n'\n"
     ]
    }
   ],
   "source": [
    "import requests\n",
    "r = requests.get(URL_src['HTTP状态狗'])\n",
    "print (r.status_code, r.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 😉 HTTP 200  OK\n",
    "![418](https://httpstatusdogs.com/img/200.jpg)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "###  lxml + chrome\n",
    "接下来需要选择器selector抽取数据img，借用HTML的\"结构\"性(chrome要从页面选到结构，你懂的)，有两种可能，必记下来\n",
    "* xpath \n",
    "* CSS selector\n",
    "\n",
    "试第一个和另一个，看看有什麽规律 (侦探活)\n",
    "Chrome Console下使用Javascript\n",
    "* xpath: \n",
    "```$x('放這')```\n",
    "\n",
    "* CSS: \n",
    "```$('放這')```\n",
    "    "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* xpath\n",
    "  * /html/body/main/div/div[2]/a/img\n",
    "  * /html/body/main/div/div[23]/a/img\n",
    "* CSS\n",
    "  * body > main > div > div:nth-child(2) > a > img\n",
    "  * body > main > div > div:nth-child(23) > a > img\n",
    "  \n",
    "推论: xpath [2] [23] 移掉,   CSS  (2)  (23) 移掉\n",
    "\n",
    "* $x(\"/html/body/main/div/div/a/img\")\n",
    "* $(\"body > main > div > div > a > img\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[<Element img at 0x1f0bba82e58>, <Element img at 0x1f0bba82ae8>, <Element img at 0x1f0bba82958>, <Element img at 0x1f0bba82908>, <Element img at 0x1f0bba82ef8>, <Element img at 0x1f0bba82d68>, <Element img at 0x1f0bba82db8>, <Element img at 0x1f0bba82b38>, <Element img at 0x1f0bba829f8>, <Element img at 0x1f0bba82c78>, <Element img at 0x1f0bc079b88>, <Element img at 0x1f0bc0794a8>, <Element img at 0x1f0bc0798b8>, <Element img at 0x1f0bc097f98>, <Element img at 0x1f0bc097ef8>, <Element img at 0x1f0bc097ea8>, <Element img at 0x1f0bc09d138>, <Element img at 0x1f0bc09d0e8>, <Element img at 0x1f0bc0ad778>, <Element img at 0x1f0bc0ad638>, <Element img at 0x1f0bc0ad138>, <Element img at 0x1f0bc0bed68>, <Element img at 0x1f0bc0a4ae8>, <Element img at 0x1f0bc0c3278>, <Element img at 0x1f0bc0c32c8>, <Element img at 0x1f0bc0c36d8>, <Element img at 0x1f0bc0c3318>, <Element img at 0x1f0bc0c3728>, <Element img at 0x1f0bc0c3778>, <Element img at 0x1f0bc0c37c8>, <Element img at 0x1f0bc0c3818>, <Element img at 0x1f0bc0c3868>, <Element img at 0x1f0bc0c38b8>, <Element img at 0x1f0bc0c3908>, <Element img at 0x1f0bc0c3958>, <Element img at 0x1f0bc0c39a8>, <Element img at 0x1f0bc0c39f8>, <Element img at 0x1f0bc0c3a48>, <Element img at 0x1f0bc0c3a98>, <Element img at 0x1f0bc0c3ae8>, <Element img at 0x1f0bc0c3b38>, <Element img at 0x1f0bc0c3b88>, <Element img at 0x1f0bc0c3bd8>, <Element img at 0x1f0bc0c3c28>, <Element img at 0x1f0bc0c3c78>, <Element img at 0x1f0bc0c3cc8>, <Element img at 0x1f0bc0c3d18>, <Element img at 0x1f0bc0c3d68>, <Element img at 0x1f0bc0c3db8>, <Element img at 0x1f0bc0c3e08>, <Element img at 0x1f0bc0c3e58>, <Element img at 0x1f0bc0c3ea8>, <Element img at 0x1f0bc0c3ef8>, <Element img at 0x1f0bc0c3f48>, <Element img at 0x1f0bc0c3f98>, <Element img at 0x1f0bc0d6048>, <Element img at 0x1f0bc0d6098>, <Element img at 0x1f0bc0d60e8>, <Element img at 0x1f0bc0d6138>]\n"
     ]
    }
   ],
   "source": [
    "import lxml\n",
    "text_data = r.content\n",
    "tree = lxml.html.fromstring(text_data)  # 当成片语/成语记下来  lxml模块下的html处理子物件模块，从字符串转成html物件tree\n",
    "树 = lxml.html.fromstring(text_data)  # 用中文当变数名也行, 试给你看, 和上面的代码二选一就可以\n",
    "HTTP状态狗 = 树.xpath(\"/html/body/main/div/div/a/img\")  # 当成片语/成语记下来, html物件树，有方法xpath抽数据出来\n",
    "print ( HTTP状态狗 )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'100 Continue'"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "a = HTTP状态狗[0]  #  https://lxml.de/3.1/api/private/lxml.html.HtmlElement-class.html\n",
    "a.get(\"alt\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['100 Continue', '200 OK', '201 Created', '202 Accepted', '203 Non-Authoritative Information', '204 No Content', '206 Partial Content', '207 Multi-Status', '208 Already Reported', '226 IM Used', '300 Multiple Choices', '301 Moved Permanently', '302 Found', '303 See Other', '304 Not Modified', '305 Use Proxy', '306 Switch Proxy', '307 Temporary Redirect', '308 Permanent Redirect', '400 Bad Request', '401 Unauthorized', '402 Payment Required', '403 Forbidden', '404 Not Found', '405 Method Not Allowed', '406 Not Acceptable', '407 Proxy Authentication Required', '408 Request Timeout', '409 Conflict', '410 Gone', '411 Length Required', '412 Precondition Failed', '413 Request Entity Too Large', '414 Request-URI Too Long', '416 Requested Range Not Satisfiable', '417 Expectation Failed', \"418 I'm a teapot\", '420 Enhance Your Calm', '422 Unprocessable Entity', '423 Locked', '424 Failed Dependency', '425 Unordered Collection', '426 Upgrade Required', '429 Too Many Requests', '431 Request Header Fields Too Large', '444 No Response', '450 Blocked by Windows Parental Controls', '451 Unavailable For Legal Reasons', '494 Request Header Too Large', '500 Internal Server Error', '501 Not Implemented', '502 Bad Gateway', '503 Service Unavailable', '504 Gateway Timeout', '506 Variant Also Negotiates', '507 Insufficient Storage', '508 Loop Detected', '509 Bandwidth Limit Exceeded', '510 Not Extended']\n"
     ]
    }
   ],
   "source": [
    "# 用列表推導 公式 [ x做些啥 for x in 列表]\n",
    "# 抽 element img 裡的 alt文字\n",
    "list_img_alt = [ x.get(\"alt\") for x in HTTP状态狗]\n",
    "print (list_img_alt)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['img/100.jpg', 'img/200.jpg', 'img/201.jpg', 'img/202.jpg', 'img/203.jpg', 'img/204.jpg', 'img/206.jpg', 'img/207.jpg', 'img/208.jpg', 'img/226.jpg', 'img/300.jpg', 'img/301.jpg', 'img/302.jpg', 'img/303.jpg', 'img/304.jpg', 'img/305.jpg', 'img/306.jpg', 'img/307.jpg', 'img/308.jpg', 'img/400.jpg', 'img/401.jpg', 'img/402.jpg', 'img/403.jpg', 'img/404.jpg', 'img/405.jpg', 'img/406.jpg', 'img/407.jpg', 'img/408.jpg', 'img/409.jpg', 'img/410.jpg', 'img/411.jpg', 'img/412.jpg', 'img/413.jpg', 'img/414.jpg', 'img/416.jpg', 'img/417.jpg', 'img/418.jpg', 'img/420.jpg', 'img/422.jpg', 'img/423.jpg', 'img/424.jpg', 'img/425.jpg', 'img/426.jpg', 'img/429.jpg', 'img/431.jpg', 'img/444.jpg', 'img/450.jpg', 'img/451.jpg', 'img/494.jpg', 'img/500.jpg', 'img/501.jpg', 'img/502.jpg', 'img/503.jpg', 'img/504.jpg', 'img/506.jpg', 'img/507.jpg', 'img/508.jpg', 'img/509.jpg', 'img/510.jpg']\n"
     ]
    }
   ],
   "source": [
    "# 抽 url, src\n",
    "list_img_src = [ x.get(\"src\") for x in HTTP状态狗]\n",
    "print (list_img_src)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'https://httpstatusdogs.com/img/100.jpg'"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 是相對位置, 記得要和网站位置合起來使用\n",
    "# 合起來的方法, 記得使用  urllib.parse.urljoin\n",
    "# 网站位置可以用http request的反嚮 response.url, 這裡剛是叫r的變量\n",
    "\n",
    "import urllib.parse\n",
    "# urllib.parse.urljoin(url1, url2)\n",
    "\n",
    "url_base = r.url\n",
    "urllib.parse.urljoin( url_base, list_img_src[0])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 下图片\n",
    "* 备好目录 (!mkdir 目录) 不是Python代码, 是系统shell\n",
    "* 用requests存raw, 而非文字\n",
    "* [How to download image using requests](https://stackoverflow.com/questions/13137817/how-to-download-image-using-requests)\n",
    "* 以后再细说, 这下载要花点时间"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "子目录或文件 img 已经存在。\n"
     ]
    }
   ],
   "source": [
    "!mkdir img"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "import requests\n",
    "import shutil\n",
    "\n",
    "for imgfilename in list_img_src:\n",
    "    path = urllib.parse.urljoin( url_base, imgfilename)\n",
    "    \n",
    "    resp = requests.get(path, stream=True)\n",
    "    if r.status_code == 200:\n",
    "        with open(imgfilename, mode=\"wb\") as f:    # mode = write binary\n",
    "            resp.raw.decode_content = True\n",
    "            shutil.copyfileobj(resp.raw, f) \n",
    "    del resp\n",
    "            \n",
    "# 有些下载okay有些不行, 见img"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 项目2B. 豆瓣电影排行榜\n",
    "### pd.read_html 试运气"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "ename": "HTTPError",
     "evalue": "HTTP Error 418: ",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mHTTPError\u001b[0m                                 Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-14-1d6d73990aab>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mpandas\u001b[0m \u001b[1;32mas\u001b[0m \u001b[0mpd\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 2\u001b[1;33m \u001b[0mdf\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mread_html\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mURL_src\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'豆瓣电影排行榜'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mencoding\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;34m\"utf8\"\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mheader\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mindex_col\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[1;32mC:\\ProgramData\\Anaconda3\\lib\\site-packages\\pandas\\io\\html.py\u001b[0m in \u001b[0;36mread_html\u001b[1;34m(io, match, flavor, header, index_col, skiprows, attrs, parse_dates, thousands, encoding, decimal, converters, na_values, keep_default_na, displayed_only)\u001b[0m\n\u001b[0;32m   1103\u001b[0m         \u001b[0mna_values\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mna_values\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   1104\u001b[0m         \u001b[0mkeep_default_na\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mkeep_default_na\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 1105\u001b[1;33m         \u001b[0mdisplayed_only\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mdisplayed_only\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m   1106\u001b[0m     )\n",
      "\u001b[1;32mC:\\ProgramData\\Anaconda3\\lib\\site-packages\\pandas\\io\\html.py\u001b[0m in \u001b[0;36m_parse\u001b[1;34m(flavor, io, match, attrs, encoding, displayed_only, **kwargs)\u001b[0m\n\u001b[0;32m    910\u001b[0m             \u001b[1;32mbreak\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    911\u001b[0m     \u001b[1;32melse\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 912\u001b[1;33m         \u001b[0mraise_with_traceback\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mretained\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    913\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    914\u001b[0m     \u001b[0mret\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;33m[\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32mC:\\ProgramData\\Anaconda3\\lib\\site-packages\\pandas\\compat\\__init__.py\u001b[0m in \u001b[0;36mraise_with_traceback\u001b[1;34m(exc, traceback)\u001b[0m\n\u001b[0;32m     45\u001b[0m     \u001b[1;32mif\u001b[0m \u001b[0mtraceback\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mEllipsis\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     46\u001b[0m         \u001b[0m_\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0m_\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mtraceback\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0msys\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mexc_info\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 47\u001b[1;33m     \u001b[1;32mraise\u001b[0m \u001b[0mexc\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mwith_traceback\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mtraceback\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     48\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     49\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;31mHTTPError\u001b[0m: HTTP Error 418: "
     ]
    }
   ],
   "source": [
    "import pandas as pd\n",
    "from urllib.error import HTTPError\n",
    "\n",
    "# Trying our luck: let pandas fetch the page itself.\n",
    "# The site answers this request with an HTTP error (418 in the recorded run),\n",
    "# so catch and show it rather than letting the exception stop Run All.\n",
    "try:\n",
    "    df = pd.read_html(URL_src['豆瓣电影排行榜'], encoding=\"utf8\", header=0, index_col=0)\n",
    "except HTTPError as err:\n",
    "    print(err)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "418 b''\n"
     ]
    }
   ],
   "source": [
    "import requests\n",
    "\n",
    "# Bare GET with the default requests headers, to inspect the raw status and body.\n",
    "r = requests.get(url=URL_src[\"豆瓣电影排行榜\"])\n",
    "print(r.status_code, r.content, sep=\" \")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 😱 HTTP 418 到底是啥?  I'm a teapot? \n",
    "![418](https://httpstatusdogs.com/img/418.jpg)\n",
    "\n",
    "### 所以要假装自己是浏览器\n",
    "* HTTP headers: Host, User-Agent (简称UA)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 改试 requests + pd.read_html"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "import requests\n",
    "from urllib import parse\n",
    "\n",
    "# Target page, plus a Session (keeps cookies and reuses the connection between requests).\n",
    "u = URL_src[\"豆瓣电影排行榜\"]\n",
    "s = requests.Session()\n",
    "\n",
    "# Browser-like headers: the bare request in the earlier cell came back as 418.\n",
    "_headers_ = {\n",
    "    \"Accept\": \"text/plain, */*; q=0.01\",\n",
    "    \"Connection\": \"keep-alive\",\n",
    "    \"Host\": \"movie.douban.com\",\n",
    "    \"User-Agent\": (\n",
    "        \"Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 \"\n",
    "        \"(KHTML, like Gecko) Chrome/62.0.3250.0 Iron Safari/537.36\"\n",
    "    ),\n",
    "}\n",
    "r = s.get(url=u, headers=_headers_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "200 b'<!DOCTYPE html>\\n<html lang=\"zh-cmn-Hans\" class=\"ua-windows ua-webkit\">\\n<head>\\n    <meta http-equiv=\"Content-Type\" content=\"text/html; charset=utf-8\">\\n    <meta name=\"renderer\" content=\"webkit\">\\n    <meta name=\"referrer\" content=\"always\">\\n    <meta name=\"google-site-verification\" content=\"ok0wCgT20tBBgo9_zat2iAcimtN4Ftf5ccsh092Xeyw\" />\\n    <title>\\n\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe6\\x8e\\x92\\xe8\\xa1\\x8c\\xe6\\xa6\\x9c\\n</title>\\n    \\n    <meta name=\"baidu-site-verification\" content=\"cZdR4xxR7RxmM4zE\" />\\n    <meta http-equiv=\"Pragma\" content=\"no-cache\">\\n    <meta http-equiv=\"Expires\" content=\"Sun, 6 Mar 2005 01:00:00 GMT\">\\n    \\n    <meta name=\"keywords\" content=\"\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe6\\x8e\\x92\\xe8\\xa1\\x8c\\xe6\\xa6\\x9c\\xe3\\x80\\x81\\xe6\\x96\\xb0\\xe7\\x89\\x87\\xe6\\x8e\\x92\\xe8\\xa1\\x8c\\xe6\\xa6\\x9c\\xe3\\x80\\x81\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe7\\x94\\xb5\\xe5\\xbd\\xb1250\"/>\\n    <meta name=\"description\" content=\"\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe6\\x8e\\x92\\xe8\\xa1\\x8c\\xe6\\xa6\\x9c,\\xe6\\x8f\\x90\\xe4\\xbe\\x9b\\xe6\\x9c\\x80\\xe6\\x96\\xb0\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe6\\x8e\\x92\\xe8\\xa1\\x8c\\xe6\\xa6\\x9c\\xe3\\x80\\x81\\xe6\\x9c\\xac\\xe5\\x91\\xa8\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe5\\x8f\\xa3\\xe7\\xa2\\x91\\xe6\\xa6\\x9c\\xe5\\x92\\x8c\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe7\\x94\\xb5\\xe5\\xbd\\xb1TOP250\" />\\n\\n    <link rel=\"apple-touch-icon\" href=\"https://img3.doubanio.com/f/movie/d59b2715fdea4968a450ee5f6c95c7d7a2030065/pics/movie/apple-touch-icon.png\">\\n    <link href=\"https://img3.doubanio.com/f/shire/3e5dfc68b0f376484c50cf08a58bbca3700911dc/css/douban.css\" rel=\"stylesheet\" type=\"text/css\">\\n    <link href=\"https://img3.doubanio.com/f/shire/ae3f5a3e3085968370b1fc63afcecb22d3284848/css/separation/_all.css\" rel=\"stylesheet\" type=\"text/css\">\\n    <link 
href=\"https://img3.doubanio.com/f/movie/8864d3756094f5272d3c93e30ee2e324665855b0/css/movie/base/init.css\" rel=\"stylesheet\">\\n    <script type=\"text/javascript\">var _head_start = new Date();</script>\\n    <script type=\"text/javascript\" src=\"https://img3.doubanio.com/f/movie/0495cb173e298c28593766009c7b0a953246c5b5/js/movie/lib/jquery.js\"></script>\\n    <script type=\"text/javascript\" src=\"https://img3.doubanio.com/f/shire/5ecaf46d6954d5a30bc7d99be86ae34031646e00/js/douban.js\"></script>\\n    <script type=\"text/javascript\" src=\"https://img3.doubanio.com/f/shire/0efdc63b77f895eaf85281fb0e44d435c6239a3f/js/separation/_all.js\"></script>\\n    \\n    <style type=\"text/css\"></style>\\n    <style type=\"text/css\">img { max-width: 100%; }</style>\\n    <script type=\"text/javascript\"></script>\\n    <link rel=\"stylesheet\" href=\"https://img3.doubanio.com/misc/mixed_static/7014746226b5bef9.css\">\\n\\n    <link rel=\"shortcut icon\" href=\"https://img3.doubanio.com/favicon.ico\" type=\"image/x-icon\">\\n</head>\\n\\n<body>\\n  \\n    <script type=\"text/javascript\">var _body_start = new Date();</script>\\n\\n    \\n    \\n\\n\\n\\n    <link href=\"//img3.doubanio.com/dae/accounts/resources/f5f3d66/shire/bundle.css\" rel=\"stylesheet\" type=\"text/css\">\\n\\n\\n\\n<div id=\"db-global-nav\" class=\"global-nav\">\\n  <div class=\"bd\">\\n    \\n<div class=\"top-nav-info\">\\n  <a href=\"https://accounts.douban.com/passport/login?source=movie\" class=\"nav-login\" rel=\"nofollow\">\\xe7\\x99\\xbb\\xe5\\xbd\\x95/\\xe6\\xb3\\xa8\\xe5\\x86\\x8c</a>\\n</div>\\n\\n\\n    <div class=\"top-nav-doubanapp\">\\n  <a href=\"https://www.douban.com/doubanapp/app?channel=top-nav\" class=\"lnk-doubanapp\">\\xe4\\xb8\\x8b\\xe8\\xbd\\xbd\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe5\\xae\\xa2\\xe6\\x88\\xb7\\xe7\\xab\\xaf</a>\\n  <div id=\"doubanapp-tip\">\\n    <a href=\"https://www.douban.com/doubanapp/app?channel=qipao\" class=\"tip-link\">\\xe8\\xb1\\x86\\xe7\\x93\\xa3 <span 
class=\"version\">6.0</span> \\xe5\\x85\\xa8\\xe6\\x96\\xb0\\xe5\\x8f\\x91\\xe5\\xb8\\x83</a>\\n    <a href=\"javascript: void 0;\" class=\"tip-close\">\\xc3\\x97</a>\\n  </div>\\n  <div id=\"top-nav-appintro\" class=\"more-items\">\\n    <p class=\"appintro-title\">\\xe8\\xb1\\x86\\xe7\\x93\\xa3</p>\\n    <p class=\"qrcode\">\\xe6\\x89\\xab\\xe7\\xa0\\x81\\xe7\\x9b\\xb4\\xe6\\x8e\\xa5\\xe4\\xb8\\x8b\\xe8\\xbd\\xbd</p>\\n    <div class=\"download\">\\n      <a href=\"https://www.douban.com/doubanapp/redirect?channel=top-nav&direct_dl=1&download=iOS\">iPhone</a>\\n      <span>\\xc2\\xb7</span>\\n      <a href=\"https://www.douban.com/doubanapp/redirect?channel=top-nav&direct_dl=1&download=Android\" class=\"download-android\">Android</a>\\n    </div>\\n  </div>\\n</div>\\n\\n    \\n\\n\\n<div class=\"global-nav-items\">\\n  <ul>\\n    <li class=\"\">\\n      <a href=\"https://www.douban.com\" target=\"_blank\" data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-main&quot;,&quot;uid&quot;:&quot;0&quot;}\">\\xe8\\xb1\\x86\\xe7\\x93\\xa3</a>\\n    </li>\\n    <li class=\"\">\\n      <a href=\"https://book.douban.com\" target=\"_blank\" data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-book&quot;,&quot;uid&quot;:&quot;0&quot;}\">\\xe8\\xaf\\xbb\\xe4\\xb9\\xa6</a>\\n    </li>\\n    <li class=\"on\">\\n      <a href=\"https://movie.douban.com\"  data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-movie&quot;,&quot;uid&quot;:&quot;0&quot;}\">\\xe7\\x94\\xb5\\xe5\\xbd\\xb1</a>\\n    </li>\\n    <li class=\"\">\\n      <a href=\"https://music.douban.com\" target=\"_blank\" data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-music&quot;,&quot;uid&quot;:&quot;0&quot;}\">\\xe9\\x9f\\xb3\\xe4\\xb9\\x90</a>\\n    </li>\\n    <li class=\"\">\\n      <a href=\"https://www.douban.com/location\" target=\"_blank\" data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-location&quot;,&quot;uid&quot;:&quot;0&quot;}\">\\xe5\\x90\\x8c\\xe5\\x9f\\x8e</a>\\n    
</li>\\n    <li class=\"\">\\n      <a href=\"https://www.douban.com/group\" target=\"_blank\" data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-group&quot;,&quot;uid&quot;:&quot;0&quot;}\">\\xe5\\xb0\\x8f\\xe7\\xbb\\x84</a>\\n    </li>\\n    <li class=\"\">\\n      <a href=\"https://read.douban.com&#47;?dcs=top-nav&amp;dcm=douban\" target=\"_blank\" data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-read&quot;,&quot;uid&quot;:&quot;0&quot;}\">\\xe9\\x98\\x85\\xe8\\xaf\\xbb</a>\\n    </li>\\n    <li class=\"\">\\n      <a href=\"https://douban.fm&#47;?from_=shire_top_nav\" target=\"_blank\" data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-fm&quot;,&quot;uid&quot;:&quot;0&quot;}\">FM</a>\\n    </li>\\n    <li class=\"\">\\n      <a href=\"https://time.douban.com&#47;?dt_time_source=douban-web_top_nav\" target=\"_blank\" data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-time&quot;,&quot;uid&quot;:&quot;0&quot;}\">\\xe6\\x97\\xb6\\xe9\\x97\\xb4</a>\\n    </li>\\n    <li class=\"\">\\n      <a href=\"https://market.douban.com&#47;?utm_campaign=douban_top_nav&amp;utm_source=douban&amp;utm_medium=pc_web\" target=\"_blank\" data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-market&quot;,&quot;uid&quot;:&quot;0&quot;}\">\\xe8\\xb1\\x86\\xe5\\x93\\x81</a>\\n    </li>\\n    <li>\\n      <a href=\"#more\" class=\"bn-more\"><span>\\xe6\\x9b\\xb4\\xe5\\xa4\\x9a</span></a>\\n      <div class=\"more-items\">\\n        <table cellpadding=\"0\" cellspacing=\"0\">\\n          <tbody>\\n            <tr>\\n              <td>\\n                <a href=\"https://ypy.douban.com\" target=\"_blank\" data-moreurl-dict=\"{&quot;from&quot;:&quot;top-nav-click-ypy&quot;,&quot;uid&quot;:&quot;0&quot;}\">\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe6\\x91\\x84\\xe5\\xbd\\xb1</a>\\n              </td>\\n            </tr>\\n          </tbody>\\n        </table>\\n      </div>\\n    </li>\\n  </ul>\\n</div>\\n\\n  </div>\\n</div>\\n<script>\\n  ;window._GLOBAL_NAV = {\\n 
   DOUBAN_URL: \"https://www.douban.com\",\\n    N_NEW_NOTIS: 0,\\n    N_NEW_DOUMAIL: 0\\n  };\\n</script>\\n\\n\\n\\n    <script src=\"//img3.doubanio.com/dae/accounts/resources/f5f3d66/shire/bundle.js\" defer=\"defer\"></script>\\n\\n\\n\\n\\n    \\n\\n\\n\\n    <link href=\"//img3.doubanio.com/dae/accounts/resources/f5f3d66/movie/bundle.css\" rel=\"stylesheet\" type=\"text/css\">\\n\\n\\n\\n\\n<div id=\"db-nav-movie\" class=\"nav\">\\n  <div class=\"nav-wrap\">\\n  <div class=\"nav-primary\">\\n    <div class=\"nav-logo\">\\n      <a href=\"https:&#47;&#47;movie.douban.com\">\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe7\\x94\\xb5\\xe5\\xbd\\xb1</a>\\n    </div>\\n    <div class=\"nav-search\">\\n      <form action=\"https:&#47;&#47;search.douban.com&#47;movie/subject_search\" method=\"get\">\\n        <fieldset>\\n          <legend>\\xe6\\x90\\x9c\\xe7\\xb4\\xa2\\xef\\xbc\\x9a</legend>\\n          <label for=\"inp-query\">\\n          </label>\\n          <div class=\"inp\"><input id=\"inp-query\" name=\"search_text\" size=\"22\" maxlength=\"60\" placeholder=\"\\xe6\\x90\\x9c\\xe7\\xb4\\xa2\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe3\\x80\\x81\\xe7\\x94\\xb5\\xe8\\xa7\\x86\\xe5\\x89\\xa7\\xe3\\x80\\x81\\xe7\\xbb\\xbc\\xe8\\x89\\xba\\xe3\\x80\\x81\\xe5\\xbd\\xb1\\xe4\\xba\\xba\" value=\"\"></div>\\n          <div class=\"inp-btn\"><input type=\"submit\" value=\"\\xe6\\x90\\x9c\\xe7\\xb4\\xa2\"></div>\\n          <input type=\"hidden\" name=\"cat\" value=\"1002\" />\\n        </fieldset>\\n      </form>\\n    </div>\\n  </div>\\n  </div>\\n  <div class=\"nav-secondary\">\\n    \\n\\n<div class=\"nav-items\">\\n  <ul>\\n    <li    ><a href=\"https://movie.douban.com/cinema/nowplaying/\"\\n     >\\xe5\\xbd\\xb1\\xe8\\xae\\xaf&\\xe8\\xb4\\xad\\xe7\\xa5\\xa8</a>\\n    </li>\\n    <li    ><a href=\"https://movie.douban.com/explore\"\\n     >\\xe9\\x80\\x89\\xe7\\x94\\xb5\\xe5\\xbd\\xb1</a>\\n    </li>\\n    <li    ><a href=\"https://movie.douban.com/tv/\"\\n     
>\\xe7\\x94\\xb5\\xe8\\xa7\\x86\\xe5\\x89\\xa7</a>\\n    </li>\\n    <li    ><a href=\"https://movie.douban.com/chart\"\\n     >\\xe6\\x8e\\x92\\xe8\\xa1\\x8c\\xe6\\xa6\\x9c</a>\\n    </li>\\n    <li    ><a href=\"https://movie.douban.com/tag/\"\\n     >\\xe5\\x88\\x86\\xe7\\xb1\\xbb</a>\\n    </li>\\n    <li    ><a href=\"https://movie.douban.com/review/best/\"\\n     >\\xe5\\xbd\\xb1\\xe8\\xaf\\x84</a>\\n    </li>\\n    <li    ><a href=\"https://movie.douban.com/annual/2019?source=navigation\"\\n     >2019\\xe5\\xb9\\xb4\\xe5\\xba\\xa6\\xe6\\xa6\\x9c\\xe5\\x8d\\x95</a>\\n    </li>\\n    <li    ><a href=\"https://m.douban.com/standbyme/annual2019?source=navigation\"\\n            target=\"_blank\"\\n     >2019\\xe4\\xb9\\xa6\\xe5\\xbd\\xb1\\xe9\\x9f\\xb3\\xe6\\x8a\\xa5\\xe5\\x91\\x8a</a>\\n    </li>\\n  </ul>\\n</div>\\n\\n    <a href=\"https://movie.douban.com/annual/2019?source=movie_navigation\" class=\"movieannual\"></a>\\n  </div>\\n</div>\\n\\n<script id=\"suggResult\" type=\"text/x-jquery-tmpl\">\\n  <li data-link=\"{{= url}}\">\\n            <a href=\"{{= url}}\" onclick=\"moreurl(this, {from:\\'movie_search_sugg\\', query:\\'{{= keyword }}\\', subject_id:\\'{{= id}}\\', i: \\'{{= index}}\\', type: \\'{{= type}}\\'})\">\\n            <img src=\"{{= img}}\" width=\"40\" />\\n            <p>\\n                <em>{{= title}}</em>\\n                {{if year}}\\n                    <span>{{= year}}</span>\\n                {{/if}}\\n                {{if sub_title}}\\n                    <br /><span>{{= sub_title}}</span>\\n                {{/if}}\\n                {{if address}}\\n                    <br /><span>{{= address}}</span>\\n                {{/if}}\\n                {{if episode}}\\n                    {{if episode==\"unknow\"}}\\n                        <br /><span>\\xe9\\x9b\\x86\\xe6\\x95\\xb0\\xe6\\x9c\\xaa\\xe7\\x9f\\xa5</span>\\n                    {{else}}\\n                        <br /><span>\\xe5\\x85\\xb1{{= 
episode}}\\xe9\\x9b\\x86</span>\\n                    {{/if}}\\n                {{/if}}\\n            </p>\\n        </a>\\n        </li>\\n  </script>\\n\\n\\n\\n\\n    <script src=\"//img3.doubanio.com/dae/accounts/resources/f5f3d66/movie/bundle.js\" defer=\"defer\"></script>\\n\\n\\n\\n\\n\\n    \\n    <div id=\"wrapper\">\\n        \\n\\n        \\n    <div id=\"content\">\\n        \\n    <h1>\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe6\\x8e\\x92\\xe8\\xa1\\x8c\\xe6\\xa6\\x9c</h1>\\n\\n        <div class=\"grid-16-8 clearfix\">\\n            \\n            \\n            <div class=\"article\">\\n                \\n    <h2>\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe6\\x96\\xb0\\xe7\\x89\\x87\\xe6\\xa6\\x9c   \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 </h2>\\n    <div class=\"indent\">\\n        \\n\\n\\n\\n\\n\\n<div class=\"\">\\n    <p class=\"ul first\"></p>\\n    <table width=\"100%\" class=\"\">\\n        <tr class=\"item\">\\n            <td width=\"100\" valign=\"top\">\\n                \\n\\n                    <a class=\"nbg\" href=\"https://movie.douban.com/subject/30252495/\"  title=\"1917\">\\n                        <img src=\"https://img3.doubanio.com/view/photo/s_ratio_poster/public/p2587146023.jpg\" width=\"75\" alt=\"1917\" class=\"\"/>\\n                    </a>\\n            </td>\\n\\n            <td valign=\"top\">\\n                \\n\\n                <div class=\"pl2\">\\n\\n                    <a href=\"https://movie.douban.com/subject/30252495/\"  class=\"\">\\n                        1917\\n                        / <span style=\"font-size:13px;\">1917\\xef\\xbc\\x9a\\xe9\\x80\\x86\\xe6\\x88\\x98\\xe6\\x95\\x91\\xe5\\x85\\xb5(\\xe6\\xb8\\xaf) / \\xe4\\xb8\\x80\\xe4\\xb9\\x9d\\xe4\\xb8\\x80\\xe4\\xb8\\x83</span>\\n                    </a>\\n\\n\\n\\n                    <p class=\"pl\">2019-12-25(\\xe7\\xbe\\x8e\\xe5\\x9b\\xbd) / 2020-01-10(\\xe8\\x8b\\xb1\\xe5\\x9b\\xbd) / 
2020(\\xe4\\xb8\\xad\\xe5\\x9b\\xbd\\xe5\\xa4\\xa7\\xe9\\x99\\x86) / \\xe4\\xb9\\x94\\xe6\\xb2\\xbb\\xc2\\xb7\\xe9\\xba\\xa6\\xe5\\x87\\xaf / \\xe8\\xbf\\xaa\\xe6\\x81\\xa9\\xc2\\xb7\\xe6\\x9f\\xa5\\xe5\\xb0\\x94\\xe6\\x96\\xaf\\xc2\\xb7\\xe6\\x9f\\xa5\\xe6\\x99\\xae\\xe6\\x9b\\xbc / \\xe7\\xa7\\x91\\xe6\\x9e\\x97\\xc2\\xb7\\xe8\\xb4\\xb9\\xe5\\xb0\\x94\\xe6\\x96\\xaf / \\xe6\\x9c\\xac\\xe5\\xb0\\xbc\\xe8\\xbf\\xaa\\xe5\\x85\\x8b\\xe7\\x89\\xb9\\xc2\\xb7\\xe5\\xba\\xb7\\xe4\\xbc\\xaf\\xe5\\xb7\\xb4\\xe5\\xa5\\x87 / \\xe9\\xa9\\xac\\xe5\\x85\\x8b\\xc2\\xb7\\xe6\\x96\\xaf\\xe7\\x89\\xb9\\xe6\\x9c\\x97 / \\xe7\\x90\\x86\\xe6\\x9f\\xa5\\xe5\\xbe\\xb7\\xc2\\xb7\\xe9\\xba\\xa6\\xe7\\x99\\xbb / \\xe5\\xae\\x89\\xe5\\xbe\\xb7\\xe9\\xb2\\x81\\xc2\\xb7\\xe6\\x96\\xaf\\xe7\\xa7\\x91\\xe7\\x89\\xb9 / \\xe4\\xb8\\xb9\\xe5\\xb0\\xbc\\xe5\\xb0\\x94\\xc2\\xb7\\xe6\\xa2\\x85\\xe6\\x96\\xaf / \\xe9\\x98\\xbf\\xe5\\xbe\\xb7\\xe9\\x87\\x8c\\xe5\\xae\\x89\\xc2\\xb7\\xe6\\x96\\xaf\\xe5\\x8d\\xa1\\xe4\\xbc\\xaf\\xe5\\x8b\\x92 / \\xe7\\xba\\xa6\\xe7\\xbf\\xb0\\xc2\\xb7\\xe9\\x9c\\x8d\\xe6\\x9e\\x97\\xe6\\xb2\\x83\\xe6\\x80\\x9d / \\xe5\\x85\\x8b\\xe9\\x87\\x8c\\xe6\\x96\\xaf\\xc2\\xb7\\xe7\\x93\\xa6\\xe5\\x88\\xa9...</p>\\n\\n                    \\n\\n\\n                        \\n                        <div class=\"star clearfix\">\\n                                <span class=\"allstar45\"></span>\\n                                <span class=\"rating_nums\">8.5</span>\\n                                <span class=\"pl\">(152102\\xe4\\xba\\xba\\xe8\\xaf\\x84\\xe4\\xbb\\xb7)</span>\\n\\n                        </div>\\n\\n\\n                </div>\\n\\n            </td>\\n        </tr>\\n    </table>\\n    <div id=\"collect_form_30252495\"></div>\\n    <p class=\"ul\"></p>\\n    <table width=\"100%\" class=\"\">\\n        <tr class=\"item\">\\n            <td width=\"100\" valign=\"top\">\\n                \\n\\n                    <a class=\"nbg\" 
href=\"https://movie.douban.com/subject/26348103/\"  title=\"\\xe5\\xb0\\x8f\\xe5\\xa6\\x87\\xe4\\xba\\xba\">\\n                        <img src=\"https://img1.doubanio.com/view/photo/s_ratio_poster/public/p2575325937.jpg\" width=\"75\" alt=\"\\xe5\\xb0\\x8f\\xe5\\xa6\\x87\\xe4\\xba\\xba\" class=\"\"/>\\n                    </a>\\n            </td>\\n\\n            <td valign=\"top\">\\n                \\n\\n                <div class=\"pl2\">\\n\\n                    <a href=\"https://movie.douban.com/subject/26348103/\"  class=\"\">\\n                        \\xe5\\xb0\\x8f\\xe5\\xa6\\x87\\xe4\\xba\\xba\\n                        / <span style=\"font-size:13px;\">\\xe5\\xa5\\xb9\\xe4\\xbb\\xac(\\xe5\\x8f\\xb0)</span>\\n                    </a>\\n\\n\\n\\n                    <p class=\"pl\">2019-12-25(\\xe7\\xbe\\x8e\\xe5\\x9b\\xbd) / 2020(\\xe4\\xb8\\xad\\xe5\\x9b\\xbd\\xe5\\xa4\\xa7\\xe9\\x99\\x86) / \\xe8\\xa5\\xbf\\xe5\\xb0\\x94\\xe8\\x8e\\x8e\\xc2\\xb7\\xe7\\xbd\\x97\\xe5\\x8d\\x97 / \\xe8\\x89\\xbe\\xe7\\x8e\\x9b\\xc2\\xb7\\xe6\\xb2\\x83\\xe6\\xa3\\xae / \\xe5\\xbc\\x97\\xe6\\xb4\\x9b\\xe4\\xbc\\xa6\\xe6\\x96\\xaf\\xc2\\xb7\\xe7\\x9a\\xae\\xe5\\xb0\\xa4 / \\xe4\\xbc\\x8a\\xe8\\x8e\\xb1\\xe6\\x89\\x8e\\xc2\\xb7\\xe6\\x96\\xaf\\xe5\\x9d\\x8e\\xe4\\xbc\\xa6 / \\xe5\\x8a\\xb3\\xe6\\x8b\\x89\\xc2\\xb7\\xe9\\x82\\x93\\xe6\\x81\\xa9 / \\xe8\\x92\\x82\\xe8\\x8e\\xab\\xe8\\xa5\\xbf\\xc2\\xb7\\xe6\\x9f\\xb4\\xe5\\x8b\\x92\\xe6\\xa2\\x85\\xe5\\xbe\\xb7 / \\xe6\\xa2\\x85\\xe4\\xb8\\xbd\\xe5\\xb0\\x94\\xc2\\xb7\\xe6\\x96\\xaf\\xe7\\x89\\xb9\\xe9\\x87\\x8c\\xe6\\x99\\xae / \\xe9\\xb2\\x8d\\xe5\\x8b\\x83\\xc2\\xb7\\xe5\\xa5\\xa5\\xe7\\x99\\xbb\\xe7\\xa7\\x91\\xe5\\x85\\x8b / \\xe8\\xa9\\xb9\\xe5\\xa7\\x86\\xe6\\x96\\xaf\\xc2\\xb7\\xe8\\xaf\\xba\\xe9\\xa1\\xbf / \\xe8\\xb7\\xaf\\xe6\\x98\\x93\\xc2\\xb7\\xe5\\x8a\\xa0\\xe7\\x91\\x9e\\xe5\\xb0\\x94 / \\xe5\\x85\\x8b\\xe9\\x87\\x8c\\xe6\\x96\\xaf\\xc2\\xb7\\xe5\\xba\\x93\\xe7\\x8f\\x80 / 
\\xe5\\xb4\\x94\\xe8\\xa5\\xbf\\xc2\\xb7\\xe8\\x8e\\xb1\\xe8\\x8c\\xa8 / \\xe8\\x89\\xbe\\xe6\\xaf\\x94\\xc2\\xb7\\xe5\\xa5\\x8e\\xe5\\x9b\\xa0...</p>\\n\\n                    \\n\\n\\n                        \\n                        <div class=\"star clearfix\">\\n                                <span class=\"allstar40\"></span>\\n                                <span class=\"rating_nums\">8.1</span>\\n                                <span class=\"pl\">(118362\\xe4\\xba\\xba\\xe8\\xaf\\x84\\xe4\\xbb\\xb7)</span>\\n\\n                        </div>\\n\\n\\n                </div>\\n\\n            </td>\\n        </tr>\\n    </table>\\n    <div id=\"collect_form_26348103\"></div>\\n    <p class=\"ul\"></p>\\n    <table width=\"100%\" class=\"\">\\n        <tr class=\"item\">\\n            <td width=\"100\" valign=\"top\">\\n                \\n\\n                    <a class=\"nbg\" href=\"https://movie.douban.com/subject/27010768/\"  title=\"\\xe5\\xaf\\x84\\xe7\\x94\\x9f\\xe8\\x99\\xab\">\\n                        <img src=\"https://img3.doubanio.com/view/photo/s_ratio_poster/public/p2561439800.jpg\" width=\"75\" alt=\"\\xe5\\xaf\\x84\\xe7\\x94\\x9f\\xe8\\x99\\xab\" class=\"\"/>\\n                    </a>\\n            </td>\\n\\n            <td valign=\"top\">\\n                \\n\\n                <div class=\"pl2\">\\n\\n                    <a href=\"https://movie.douban.com/subject/27010768/\"  class=\"\">\\n                        \\xe5\\xaf\\x84\\xe7\\x94\\x9f\\xe8\\x99\\xab\\n                        / <span style=\"font-size:13px;\">\\xe5\\xaf\\x84\\xe7\\x94\\x9f\\xe4\\xb8\\x8a\\xe6\\xb5\\x81(\\xe5\\x8f\\xb0) / \\xe4\\xb8\\x8a\\xe6\\xb5\\x81\\xe5\\xaf\\x84\\xe7\\x94\\x9f\\xe6\\x97\\x8f(\\xe6\\xb8\\xaf)</span>\\n                    </a>\\n\\n\\n\\n                    <p class=\"pl\">2019-05-21(\\xe6\\x88\\x9b\\xe7\\xba\\xb3\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe8\\x8a\\x82) / 2019-05-30(\\xe9\\x9f\\xa9\\xe5\\x9b\\xbd) / 
\\xe5\\xae\\x8b\\xe5\\xba\\xb7\\xe6\\x98\\x8a / \\xe6\\x9d\\x8e\\xe5\\x96\\x84\\xe5\\x9d\\x87 / \\xe8\\xb5\\xb5\\xe6\\xb1\\x9d\\xe8\\xb4\\x9e / \\xe5\\xb4\\x94\\xe5\\xae\\x87\\xe6\\xa4\\x8d / \\xe6\\x9c\\xb4\\xe7\\xb4\\xa0\\xe4\\xb8\\xb9 / \\xe6\\x9d\\x8e\\xe9\\x9d\\x99\\xe6\\x81\\xa9 / \\xe5\\xbc\\xa0\\xe6\\x85\\xa7\\xe7\\x8f\\x8d / \\xe9\\x83\\x91\\xe7\\x9f\\xa5\\xe6\\x99\\x93 / \\xe6\\x9c\\xb4\\xe6\\x98\\x8e\\xe5\\x8b\\x8b / \\xe6\\x9c\\xb4\\xe5\\x8f\\x99\\xe4\\xbf\\x8a / \\xe6\\x9c\\xb4\\xe6\\xa0\\xb9\\xe7\\xa5\\xbf / \\xe9\\x83\\x91\\xe8\\xb4\\xa4\\xe4\\xbf\\x8a / \\xe6\\x9c\\xb4\\xe5\\xad\\x9d\\xe6\\x96\\xb0 / \\xe5\\xae\\x89\\xe5\\xbe\\xb7\\xe7\\x83\\x88\\xe4\\xba\\x9a\\xe6\\x96\\xaf\\xc2\\xb7\\xe5\\xbc\\x97\\xe9\\xbe\\x99\\xe5\\x85\\x8b / \\xe9\\x83\\x91\\xe7\\x9b\\x8a\\xe6\\xb1\\x89 / \\xe6\\x9d\\x8e\\xe4\\xb8\\x9c\\xe5\\x8b\\x87 / \\xe6\\x9d\\x8e\\xe6\\x9f\\xb1\\xe4\\xba\\xa8 / \\xe6\\x9e\\x97\\xe8\\x89\\xba\\xe6\\x81\\xa9 / \\xe9\\x9f\\xa9\\xe5\\x9b\\xbd / \\xe5\\xa5\\x89\\xe4\\xbf\\x8a\\xe6\\x98\\x8a...</p>\\n\\n                    \\n\\n\\n                        \\n                        <div class=\"star clearfix\">\\n                                <span class=\"allstar45\"></span>\\n                                <span class=\"rating_nums\">8.7</span>\\n                                <span class=\"pl\">(894668\\xe4\\xba\\xba\\xe8\\xaf\\x84\\xe4\\xbb\\xb7)</span>\\n\\n                        </div>\\n\\n\\n                </div>\\n\\n            </td>\\n        </tr>\\n    </table>\\n    <div id=\"collect_form_27010768\"></div>\\n    <p class=\"ul\"></p>\\n    <table width=\"100%\" class=\"\">\\n        <tr class=\"item\">\\n            <td width=\"100\" valign=\"top\">\\n                \\n\\n                    <a class=\"nbg\" href=\"https://movie.douban.com/subject/30241298/\"  title=\"\\xe5\\x8d\\x97\\xe5\\xb1\\xb1\\xe7\\x9a\\x84\\xe9\\x83\\xa8\\xe9\\x95\\xbf\\xe4\\xbb\\xac\">\\n                        <img 
src=\"https://img3.doubanio.com/view/photo/s_ratio_poster/public/p2581888792.jpg\" width=\"75\" alt=\"\\xe5\\x8d\\x97\\xe5\\xb1\\xb1\\xe7\\x9a\\x84\\xe9\\x83\\xa8\\xe9\\x95\\xbf\\xe4\\xbb\\xac\" class=\"\"/>\\n                    </a>\\n            </td>\\n\\n            <td valign=\"top\">\\n                \\n\\n                <div class=\"pl2\">\\n\\n                    <a href=\"https://movie.douban.com/subject/30241298/\"  class=\"\">\\n                        \\xe5\\x8d\\x97\\xe5\\xb1\\xb1\\xe7\\x9a\\x84\\xe9\\x83\\xa8\\xe9\\x95\\xbf\\xe4\\xbb\\xac\\n                        / <span style=\"font-size:13px;\">The Man Standing Next</span>\\n                    </a>\\n\\n\\n\\n                    <p class=\"pl\">2020-01-22(\\xe9\\x9f\\xa9\\xe5\\x9b\\xbd) / \\xe6\\x9d\\x8e\\xe7\\xa7\\x89\\xe5\\xae\\xaa / \\xe6\\x9d\\x8e\\xe6\\x98\\x9f\\xe6\\xb0\\x91 / \\xe9\\x83\\xad\\xe5\\xba\\xa6\\xe6\\xb2\\x85 / \\xe6\\x9d\\x8e\\xe7\\x86\\x99\\xe4\\xbf\\x8a / \\xe9\\x87\\x91\\xe7\\xb4\\xa0\\xe7\\x9c\\x9f / \\xe5\\xbe\\x90\\xe8\\xb4\\xa4\\xe5\\xae\\x87 / \\xe6\\x9c\\xb4\\xe6\\x99\\xba\\xe4\\xb8\\x80 / \\xe6\\x9d\\x8e\\xe6\\xb3\\xb0\\xe4\\xba\\xa8 / \\xe9\\x87\\x91\\xe6\\x98\\x87\\xe5\\x8b\\x8b / \\xe9\\x87\\x91\\xe6\\x98\\x8e\\xe5\\x96\\x84  / \\xe6\\x9c\\xb4\\xe6\\x88\\x90\\xe6\\xa0\\xb9 / \\xe9\\x83\\x91\\xe9\\x92\\x9f\\xe5\\xae\\x87 / \\xe9\\x87\\x91\\xe6\\xb0\\x91\\xe5\\xb0\\x9a / \\xe5\\x91\\xa8\\xe9\\x94\\xa1\\xe6\\xb3\\xb0 / \\xe6\\x88\\x90\\xe6\\xb0\\x91\\xe7\\xa7\\x80 / \\xe8\\xb5\\xb5\\xe6\\x83\\xa0\\xe7\\x8f\\xa0 / \\xe5\\xad\\x99\\xe7\\x82\\xb3\\xe6\\x97\\xad / \\xe6\\x9c\\xb4\\xe7\\x82\\xab\\xe5\\xae\\x87 / \\xe4\\xb8\\xa5\\xe5\\xbf\\x97\\xe6\\xbb\\xa1 / \\xe6\\x9f\\xb3\\xe6\\xad\\xa3\\xe6\\xb5\\xa9 / \\xe9\\x87\\x91\\xe5\\xbc\\x98\\xe6\\xb3\\xa2 / \\xe6\\x9d\\x8e\\xe4\\xb8\\x9c\\xe5\\x9b\\xbd / \\xe9\\x9f\\xa9\\xe5\\x9b\\xbd / \\xe7\\xa6\\xb9\\xe6\\xb0\\x91\\xe9\\x95\\x90...</p>\\n\\n                    \\n\\n\\n                        \\n                        
<div class=\"star clearfix\">\\n                                <span class=\"allstar40\"></span>\\n                                <span class=\"rating_nums\">8.2</span>\\n                                <span class=\"pl\">(49775\\xe4\\xba\\xba\\xe8\\xaf\\x84\\xe4\\xbb\\xb7)</span>\\n\\n                        </div>\\n\\n\\n                </div>\\n\\n            </td>\\n        </tr>\\n    </table>\\n    <div id=\"collect_form_30241298\"></div>\\n    <p class=\"ul\"></p>\\n    <table width=\"100%\" class=\"\">\\n        <tr class=\"item\">\\n            <td width=\"100\" valign=\"top\">\\n                \\n\\n                    <a class=\"nbg\" href=\"https://movie.douban.com/subject/30160393/\"  title=\"\\xe7\\x8c\\x9b\\xe7\\xa6\\xbd\\xe5\\xb0\\x8f\\xe9\\x98\\x9f\\xe5\\x92\\x8c\\xe5\\x93\\x88\\xe8\\x8e\\x89\\xc2\\xb7\\xe5\\xa5\\x8e\\xe8\\x8c\\xb5\">\\n                        <img src=\"https://img1.doubanio.com/view/photo/s_ratio_poster/public/p2575974437.jpg\" width=\"75\" alt=\"\\xe7\\x8c\\x9b\\xe7\\xa6\\xbd\\xe5\\xb0\\x8f\\xe9\\x98\\x9f\\xe5\\x92\\x8c\\xe5\\x93\\x88\\xe8\\x8e\\x89\\xc2\\xb7\\xe5\\xa5\\x8e\\xe8\\x8c\\xb5\" class=\"\"/>\\n                    </a>\\n            </td>\\n\\n            <td valign=\"top\">\\n                \\n\\n                <div class=\"pl2\">\\n\\n                    <a href=\"https://movie.douban.com/subject/30160393/\"  class=\"\">\\n                        \\xe7\\x8c\\x9b\\xe7\\xa6\\xbd\\xe5\\xb0\\x8f\\xe9\\x98\\x9f\\xe5\\x92\\x8c\\xe5\\x93\\x88\\xe8\\x8e\\x89\\xc2\\xb7\\xe5\\xa5\\x8e\\xe8\\x8c\\xb5\\n                        / <span style=\"font-size:13px;\">\\xe5\\x93\\x88\\xe8\\x8e\\x89\\xc2\\xb7\\xe5\\xa5\\x8e\\xe5\\x9b\\xa0\\xef\\xbc\\x9a\\xe7\\x8c\\x9b\\xe7\\xa6\\xbd\\xe5\\xb0\\x8f\\xe9\\x98\\x9f / \\xe7\\x8c\\x9b\\xe7\\xa6\\xbd\\xe5\\xb0\\x8f\\xe9\\x98\\x9f</span>\\n                    </a>\\n\\n\\n\\n                    <p class=\"pl\">2020-02-07(\\xe7\\xbe\\x8e\\xe5\\x9b\\xbd) / 
\\xe7\\x8e\\x9b\\xe6\\xa0\\xbc\\xe7\\x89\\xb9\\xc2\\xb7\\xe7\\xbd\\x97\\xe6\\xaf\\x94 / \\xe7\\x8e\\x9b\\xe4\\xb8\\xbd\\xc2\\xb7\\xe4\\xbc\\x8a\\xe4\\xb8\\xbd\\xe8\\x8e\\x8e\\xe7\\x99\\xbd\\xc2\\xb7\\xe6\\xb8\\xa9\\xe6\\x96\\xaf\\xe7\\x89\\xb9\\xe5\\xbe\\xb7 / \\xe7\\xbd\\x97\\xe8\\x8c\\x9c\\xc2\\xb7\\xe4\\xbd\\xa9\\xe9\\x9b\\xb7\\xe5\\x85\\xb9 / \\xe6\\x9c\\xb1\\xe5\\xb0\\xbc\\xc2\\xb7\\xe6\\x96\\xaf\\xe8\\x8e\\xab\\xe5\\x88\\xa9\\xe7\\x89\\xb9 / \\xe4\\xbc\\x8a\\xe4\\xb8\\x87\\xc2\\xb7\\xe9\\xba\\xa6\\xe5\\x85\\x8b\\xe6\\xa0\\xbc\\xe9\\x9b\\xb7\\xe6\\xa0\\xbc / \\xe5\\x9f\\x83\\xe6\\x8b\\x89\\xc2\\xb7\\xe6\\x9d\\xb0\\xe4\\xbc\\x8a\\xc2\\xb7\\xe5\\xb7\\xb4\\xe6\\x96\\xaf\\xe7\\xa7\\x91 / \\xe5\\x85\\x8b\\xe9\\x87\\x8c\\xe6\\x96\\xaf\\xc2\\xb7\\xe6\\xa2\\x85\\xe8\\xa5\\xbf\\xe7\\xba\\xb3 / \\xe9\\xbb\\x84\\xe9\\x98\\xbf\\xe4\\xb8\\xbd / \\xe6\\x88\\xb4\\xe7\\xbb\\xb4\\xc2\\xb7\\xe5\\xb0\\xa4\\xe9\\x87\\x8c / \\xe8\\x90\\xa8\\xe6\\x8b\\x89\\xc2\\xb7\\xe8\\x92\\x99\\xe7\\x89\\xb9\\xe6\\x96\\xaf / \\xe4\\xbc\\x8a\\xe8\\x8e\\x8e\\xe8\\xb4\\x9d\\xe5\\xb0\\x94\\xc2\\xb7\\xe5\\xb8\\x95\\xe5\\x85\\x8b\\xe6\\x89\\x8e\\xe5\\xbe\\xb7 / \\xe4\\xb8\\xb9\\xe5\\xb0\\xbc\\xe5\\xb0\\x94\\xc2\\xb7\\xe4\\xbc\\xaf\\xe5\\x93\\x88\\xe7\\x89\\xb9 / \\xe5\\xb8\\x95\\xe6\\xb4\\x9b\\xe9\\xa9\\xac\\xc2\\xb7\\xe6\\x8b\\x89\\xe6\\xaf\\x94\\xe8\\xaf\\xba\\xe5\\xa4\\xab...</p>\\n\\n                    \\n\\n\\n                        \\n                        <div class=\"star clearfix\">\\n                                <span class=\"allstar30\"></span>\\n                                <span class=\"rating_nums\">5.9</span>\\n                                <span class=\"pl\">(30201\\xe4\\xba\\xba\\xe8\\xaf\\x84\\xe4\\xbb\\xb7)</span>\\n\\n                        </div>\\n\\n\\n                </div>\\n\\n            </td>\\n        </tr>\\n    </table>\\n    <div id=\"collect_form_30160393\"></div>\\n    <p class=\"ul\"></p>\\n    <table width=\"100%\" class=\"\">\\n        <tr 
class=\"item\">\\n            <td width=\"100\" valign=\"top\">\\n                \\n\\n                    <a class=\"nbg\" href=\"https://movie.douban.com/subject/27119724/\"  title=\"\\xe5\\xb0\\x8f\\xe4\\xb8\\x91\">\\n                        <img src=\"https://img9.doubanio.com/view/photo/s_ratio_poster/public/p2567198874.jpg\" width=\"75\" alt=\"\\xe5\\xb0\\x8f\\xe4\\xb8\\x91\" class=\"\"/>\\n                    </a>\\n            </td>\\n\\n            <td valign=\"top\">\\n                \\n\\n                <div class=\"pl2\">\\n\\n                    <a href=\"https://movie.douban.com/subject/27119724/\"  class=\"\">\\n                        \\xe5\\xb0\\x8f\\xe4\\xb8\\x91\\n                        / <span style=\"font-size:13px;\">\\xe5\\xb0\\x8f\\xe4\\xb8\\x91\\xe8\\xb5\\xb7\\xe6\\xba\\x90\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xef\\xbc\\x9a\\xe7\\xbd\\x97\\xe5\\xaf\\x86\\xe6\\xac\\xa7 / Romeo</span>\\n                    </a>\\n\\n\\n\\n                    <p class=\"pl\">2019-08-31(\\xe5\\xa8\\x81\\xe5\\xb0\\xbc\\xe6\\x96\\xaf\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe8\\x8a\\x82) / 2019-10-04(\\xe7\\xbe\\x8e\\xe5\\x9b\\xbd) / \\xe5\\x8d\\x8e\\xe9\\x87\\x91\\xc2\\xb7\\xe8\\x8f\\xb2\\xe5\\xb0\\xbc\\xe5\\x85\\x8b\\xe6\\x96\\xaf / \\xe7\\xbd\\x97\\xe4\\xbc\\xaf\\xe7\\x89\\xb9\\xc2\\xb7\\xe5\\xbe\\xb7\\xe5\\xb0\\xbc\\xe7\\xbd\\x97 / \\xe9\\xa9\\xac\\xe5\\x85\\x8b\\xc2\\xb7\\xe9\\xa9\\xac\\xe9\\xbe\\x99 / \\xe8\\x8e\\x8e\\xe5\\xa7\\xac\\xc2\\xb7\\xe8\\xb4\\x9d\\xe5\\x85\\xb9 / \\xe8\\xb0\\xa2\\xe4\\xbc\\x8a\\xc2\\xb7\\xe6\\x83\\xa0\\xe6\\xa0\\xbc\\xe5\\xa7\\x86 / \\xe5\\xbc\\x97\\xe5\\x85\\xb0\\xe8\\xa5\\xbf\\xe4\\xb8\\x9d\\xc2\\xb7\\xe5\\xba\\xb7\\xe7\\xbd\\x97\\xe4\\xbc\\x8a / \\xe5\\xb8\\x83\\xe8\\x8e\\xb1\\xe6\\x81\\xa9\\xc2\\xb7\\xe8\\x80\\x83\\xe4\\xbc\\xa6 / \\xe5\\xb8\\x83\\xe8\\x8e\\xb1\\xe6\\x81\\xa9\\xc2\\xb7\\xe6\\xb3\\xb0\\xe9\\x87\\x8c\\xc2\\xb7\\xe4\\xba\\xa8\\xe5\\x88\\xa9 / 
\\xe5\\xb8\\x83\\xe8\\x8e\\xb1\\xe7\\x89\\xb9\\xc2\\xb7\\xe5\\x8d\\xa1\\xe4\\xbc\\xa6 / \\xe9\\x81\\x93\\xe6\\xa0\\xbc\\xe6\\x8b\\x89\\xe6\\x96\\xaf\\xc2\\xb7\\xe9\\x9c\\x8d\\xe5\\xa5\\x87\\xe6\\x96\\xaf / \\xe6\\xa0\\xbc\\xe4\\xbc\\xa6\\xc2\\xb7\\xe5\\xbc\\x97\\xe8\\x8e\\xb1\\xe6\\x96\\xbd\\xe5\\x8b\\x92 / \\xe6\\xaf\\x94\\xe5\\xb0\\x94\\xc2\\xb7\\xe5\\x9d\\x8e\\xe6\\x99\\xae...</p>\\n\\n                    \\n\\n\\n                        \\n                        <div class=\"star clearfix\">\\n                                <span class=\"allstar45\"></span>\\n                                <span class=\"rating_nums\">8.7</span>\\n                                <span class=\"pl\">(645927\\xe4\\xba\\xba\\xe8\\xaf\\x84\\xe4\\xbb\\xb7)</span>\\n\\n                        </div>\\n\\n\\n                </div>\\n\\n            </td>\\n        </tr>\\n    </table>\\n    <div id=\"collect_form_27119724\"></div>\\n    <p class=\"ul\"></p>\\n    <table width=\"100%\" class=\"\">\\n        <tr class=\"item\">\\n            <td width=\"100\" valign=\"top\">\\n                \\n\\n                    <a class=\"nbg\" href=\"https://movie.douban.com/subject/30170546/\"  title=\"\\xe4\\xb9\\x94\\xe4\\xb9\\x94\\xe7\\x9a\\x84\\xe5\\xbc\\x82\\xe6\\x83\\xb3\\xe4\\xb8\\x96\\xe7\\x95\\x8c\">\\n                        <img src=\"https://img3.doubanio.com/view/photo/s_ratio_poster/public/p2567973073.jpg\" width=\"75\" alt=\"\\xe4\\xb9\\x94\\xe4\\xb9\\x94\\xe7\\x9a\\x84\\xe5\\xbc\\x82\\xe6\\x83\\xb3\\xe4\\xb8\\x96\\xe7\\x95\\x8c\" class=\"\"/>\\n                    </a>\\n            </td>\\n\\n            <td valign=\"top\">\\n                \\n\\n                <div class=\"pl2\">\\n\\n                    <a href=\"https://movie.douban.com/subject/30170546/\"  class=\"\">\\n                        \\xe4\\xb9\\x94\\xe4\\xb9\\x94\\xe7\\x9a\\x84\\xe5\\xbc\\x82\\xe6\\x83\\xb3\\xe4\\xb8\\x96\\xe7\\x95\\x8c\\n                        / <span 
style=\"font-size:13px;\">\\xe4\\xb9\\x94\\xe4\\xb9\\x94\\xe5\\x85\\x94 / \\xe5\\xb0\\x91\\xe5\\xb9\\xb4\\xe4\\xb9\\x94\\xe4\\xb9\\x94\\xe7\\x9a\\x84\\xe5\\xbc\\x82\\xe6\\x83\\xb3\\xe4\\xb8\\x96\\xe7\\x95\\x8c</span>\\n                    </a>\\n\\n\\n\\n                    <p class=\"pl\">2019-09-08(\\xe5\\xa4\\x9a\\xe4\\xbc\\xa6\\xe5\\xa4\\x9a\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe8\\x8a\\x82) / 2019-11-08(\\xe7\\xbe\\x8e\\xe5\\x9b\\xbd) / 2020(\\xe4\\xb8\\xad\\xe5\\x9b\\xbd\\xe5\\xa4\\xa7\\xe9\\x99\\x86) / \\xe7\\xbd\\x97\\xe6\\x9b\\xbc\\xc2\\xb7\\xe6\\xa0\\xbc\\xe9\\x87\\x8c\\xe8\\x8a\\xac\\xc2\\xb7\\xe6\\x88\\xb4\\xe7\\xbb\\xb4\\xe6\\x96\\xaf / \\xe6\\x89\\x98\\xe9\\xa9\\xac\\xe8\\xbe\\x9b\\xc2\\xb7\\xe9\\xba\\xa6\\xe8\\x82\\xaf\\xe9\\xbd\\x90 / \\xe6\\x96\\xaf\\xe5\\x98\\x89\\xe4\\xb8\\xbd\\xc2\\xb7\\xe7\\xba\\xa6\\xe7\\xbf\\xb0\\xe9\\x80\\x8a / \\xe5\\xa1\\x94\\xe4\\xbc\\x8a\\xe5\\x8a\\xa0\\xc2\\xb7\\xe7\\xbb\\xb4\\xe8\\xbf\\xaa\\xe6\\x8f\\x90 / \\xe5\\xb1\\xb1\\xe5\\xa7\\x86\\xc2\\xb7\\xe6\\xb4\\x9b\\xe5\\x85\\x8b\\xe5\\xa8\\x81\\xe5\\xb0\\x94 / \\xe8\\x95\\xbe\\xe8\\x93\\x93\\xe5\\xb0\\x94\\xc2\\xb7\\xe5\\xa8\\x81\\xe5\\xb0\\x94\\xe6\\xa3\\xae / \\xe9\\x98\\xbf\\xe5\\xb0\\x94\\xe8\\x8f\\xb2\\xc2\\xb7\\xe8\\x89\\xbe\\xe4\\xbc\\xa6 / \\xe6\\x96\\xaf\\xe6\\x88\\xb4\\xe8\\x8a\\xac\\xc2\\xb7\\xe8\\x8e\\xab\\xe6\\x98\\x8c\\xe7\\x89\\xb9 / \\xe9\\x98\\xbf\\xe5\\xa5\\x87\\xc2\\xb7\\xe8\\x80\\xb6\\xe8\\x8c\\xa8 / \\xe5\\x8d\\xa2\\xe5\\x85\\x8b\\xc2\\xb7\\xe5\\xb8\\x83\\xe5\\x85\\xb0\\xe7\\x99\\xbb\\xc2\\xb7\\xe8\\x8f\\xb2\\xe5\\xb0\\x94\\xe5\\xbe\\xb7...</p>\\n\\n                    \\n\\n\\n                        \\n                        <div class=\"star clearfix\">\\n                                <span class=\"allstar40\"></span>\\n                                <span class=\"rating_nums\">8.4</span>\\n                                <span class=\"pl\">(128547\\xe4\\xba\\xba\\xe8\\xaf\\x84\\xe4\\xbb\\xb7)</span>\\n\\n                        </div>\\n\\n\\n      
          </div>\\n\\n            </td>\\n        </tr>\\n    </table>\\n    <div id=\"collect_form_30170546\"></div>\\n    <p class=\"ul\"></p>\\n    <table width=\"100%\" class=\"\">\\n        <tr class=\"item\">\\n            <td width=\"100\" valign=\"top\">\\n                \\n\\n                    <a class=\"nbg\" href=\"https://movie.douban.com/subject/30292777/\"  title=\"\\xe9\\x98\\xb3\\xe5\\x85\\x89\\xe6\\x99\\xae\\xe7\\x85\\xa7\">\\n                        <img src=\"https://img3.doubanio.com/view/photo/s_ratio_poster/public/p2570235120.jpg\" width=\"75\" alt=\"\\xe9\\x98\\xb3\\xe5\\x85\\x89\\xe6\\x99\\xae\\xe7\\x85\\xa7\" class=\"\"/>\\n                    </a>\\n            </td>\\n\\n            <td valign=\"top\">\\n                \\n\\n                <div class=\"pl2\">\\n\\n                    <a href=\"https://movie.douban.com/subject/30292777/\"  class=\"\">\\n                        \\xe9\\x98\\xb3\\xe5\\x85\\x89\\xe6\\x99\\xae\\xe7\\x85\\xa7\\n                        / <span style=\"font-size:13px;\">A Sun</span>\\n                    </a>\\n\\n\\n\\n                    <p class=\"pl\">2019-09-06(\\xe5\\xa4\\x9a\\xe4\\xbc\\xa6\\xe5\\xa4\\x9a\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe8\\x8a\\x82) / 2019-11-01(\\xe4\\xb8\\xad\\xe5\\x9b\\xbd\\xe5\\x8f\\xb0\\xe6\\xb9\\xbe) / \\xe9\\x99\\x88\\xe4\\xbb\\xa5\\xe6\\x96\\x87 / \\xe6\\x9f\\xaf\\xe6\\xb7\\x91\\xe5\\x8b\\xa4 / \\xe5\\xb7\\xab\\xe5\\xbb\\xba\\xe5\\x92\\x8c / \\xe5\\x88\\x98\\xe5\\x86\\xa0\\xe5\\xbb\\xb7 / \\xe8\\xae\\xb8\\xe5\\x85\\x89\\xe6\\xb1\\x89 / \\xe5\\xb0\\xb9\\xe9\\xa6\\xa8 / \\xe6\\xb8\\xa9\\xe8\\xb4\\x9e\\xe8\\x8f\\xb1 / \\xe5\\x90\\xb4\\xe5\\xb2\\xb1\\xe5\\x87\\x8c / \\xe6\\x9e\\x97\\xe5\\xbf\\x97\\xe5\\x84\\x92 / \\xe9\\xbe\\x99\\xe5\\x8a\\xad\\xe5\\x8d\\x8e / \\xe8\\x83\\xa1\\xe9\\xb8\\xbf\\xe8\\xbe\\xbe / \\xe6\\x96\\xbd\\xe5\\x90\\x8d\\xe5\\xb8\\x85 / \\xe5\\xbc\\xa0\\xe7\\xab\\x8b\\xe4\\xb8\\x9c / \\xe5\\xbc\\xa0\\xe5\\xb0\\x91\\xe6\\x80\\x80 / 
\\xe9\\xbb\\x84\\xe4\\xbf\\xa1\\xe5\\xb0\\xa7 / \\xe5\\xbc\\xa0\\xe7\\xbf\\xb0 / \\xe8\\x8c\\x83\\xe5\\xa7\\x9c\\xe6\\xb3\\xb0\\xe5\\x9f\\xba / \\xe5\\xbc\\xa0\\xe8\\x80\\x80\\xe5\\x8d\\x87 / \\xe4\\xb8\\xad\\xe5\\x9b\\xbd\\xe5\\x8f\\xb0\\xe6\\xb9\\xbe / \\xe9\\x92\\x9f\\xe5\\xad\\x9f\\xe5\\xae\\x8f / 155\\xe5\\x88\\x86\\xe9\\x92\\x9f...</p>\\n\\n                    \\n\\n\\n                        \\n                        <div class=\"star clearfix\">\\n                                <span class=\"allstar40\"></span>\\n                                <span class=\"rating_nums\">8.4</span>\\n                                <span class=\"pl\">(112475\\xe4\\xba\\xba\\xe8\\xaf\\x84\\xe4\\xbb\\xb7)</span>\\n\\n                        </div>\\n\\n\\n                </div>\\n\\n            </td>\\n        </tr>\\n    </table>\\n    <div id=\"collect_form_30292777\"></div>\\n    <p class=\"ul\"></p>\\n    <table width=\"100%\" class=\"\">\\n        <tr class=\"item\">\\n            <td width=\"100\" valign=\"top\">\\n                \\n\\n                    <a class=\"nbg\" href=\"https://movie.douban.com/subject/30318116/\"  title=\"\\xe5\\x88\\xa9\\xe5\\x88\\x83\\xe5\\x87\\xba\\xe9\\x9e\\x98\">\\n                        <img src=\"https://img1.doubanio.com/view/photo/s_ratio_poster/public/p2574172427.jpg\" width=\"75\" alt=\"\\xe5\\x88\\xa9\\xe5\\x88\\x83\\xe5\\x87\\xba\\xe9\\x9e\\x98\" class=\"\"/>\\n                    </a>\\n            </td>\\n\\n            <td valign=\"top\">\\n                \\n\\n                <div class=\"pl2\">\\n\\n                    <a href=\"https://movie.douban.com/subject/30318116/\"  class=\"\">\\n                        \\xe5\\x88\\xa9\\xe5\\x88\\x83\\xe5\\x87\\xba\\xe9\\x9e\\x98\\n                        / <span style=\"font-size:13px;\">\\xe8\\x87\\xb4\\xe5\\x91\\xbd\\xe9\\x81\\x97\\xe4\\xba\\xa7 / \\xe9\\x94\\x8b\\xe5\\x9b\\x9e\\xe8\\xb7\\xaf\\xe8\\xbd\\xac(\\xe5\\x8f\\xb0)</span>\\n                    </a>\\n\\n\\n\\n        
            <p class=\"pl\">2019-09-07(\\xe5\\xa4\\x9a\\xe4\\xbc\\xa6\\xe5\\xa4\\x9a\\xe7\\x94\\xb5\\xe5\\xbd\\xb1\\xe8\\x8a\\x82) / 2019-11-27(\\xe7\\xbe\\x8e\\xe5\\x9b\\xbd) / 2019-11-29(\\xe4\\xb8\\xad\\xe5\\x9b\\xbd\\xe5\\xa4\\xa7\\xe9\\x99\\x86) / \\xe4\\xb8\\xb9\\xe5\\xb0\\xbc\\xe5\\xb0\\x94\\xc2\\xb7\\xe5\\x85\\x8b\\xe9\\x9b\\xb7\\xe6\\xa0\\xbc / \\xe5\\xae\\x89\\xe5\\xa8\\x9c\\xc2\\xb7\\xe5\\xbe\\xb7\\xc2\\xb7\\xe9\\x98\\xbf\\xe7\\x8e\\x9b\\xe6\\x96\\xaf / \\xe5\\x85\\x8b\\xe9\\x87\\x8c\\xe6\\x96\\xaf\\xc2\\xb7\\xe5\\x9f\\x83\\xe6\\x96\\x87\\xe6\\x96\\xaf / \\xe6\\x9d\\xb0\\xe7\\xb1\\xb3\\xc2\\xb7\\xe6\\x9d\\x8e\\xc2\\xb7\\xe6\\x9f\\xaf\\xe8\\x92\\x82\\xe6\\x96\\xaf / \\xe8\\xbf\\x88\\xe5\\x85\\x8b\\xe5\\xb0\\x94\\xc2\\xb7\\xe7\\x8f\\x8a\\xe5\\x86\\x9c / \\xe5\\x94\\x90\\xc2\\xb7\\xe7\\xba\\xa6\\xe7\\xbf\\xb0\\xe9\\x80\\x8a / \\xe6\\x89\\x98\\xe5\\xa6\\xae\\xc2\\xb7\\xe7\\xa7\\x91\\xe8\\x8e\\xb1\\xe7\\x89\\xb9 / \\xe5\\x8b\\x92\\xe5\\x87\\xaf\\xe6\\x96\\xaf\\xc2\\xb7\\xe6\\x96\\xaf\\xe5\\x9d\\xa6\\xe8\\x8f\\xb2\\xe5\\xb0\\x94\\xe5\\xbe\\xb7 / \\xe5\\x85\\x8b\\xe9\\x87\\x8c\\xe6\\x96\\xaf\\xe6\\x89\\x98\\xe5\\xbc\\x97\\xc2\\xb7\\xe6\\x99\\xae\\xe5\\x8d\\xa2\\xe9\\xbb\\x98 / \\xe5\\x87\\xaf\\xe7\\x91\\x9f\\xe7\\x90\\xb3\\xc2\\xb7\\xe5\\x85\\xb0\\xe7\\xa6\\x8f\\xe5\\xbe\\xb7...</p>\\n\\n                    \\n\\n\\n                        \\n                        <div class=\"star clearfix\">\\n                                <span class=\"allstar40\"></span>\\n                                <span class=\"rating_nums\">8.2</span>\\n                                <span class=\"pl\">(392146\\xe4\\xba\\xba\\xe8\\xaf\\x84\\xe4\\xbb\\xb7)</span>\\n\\n                        </div>\\n\\n\\n                </div>\\n\\n            </td>\\n        </tr>\\n    </table>\\n    <div id=\"collect_form_30318116\"></div>\\n    <p class=\"ul\"></p>\\n    <table width=\"100%\" class=\"\">\\n        <tr class=\"item\">\\n            <td width=\"100\" valign=\"top\">\\n       
         \\n\\n                    <a class=\"nbg\" href=\"https://movie.douban.com/subject/30331959/\"  title=\"\\xe9\\xbb\\x91\\xe6\\xb0\\xb4\">\\n                        <img src=\"https://img3.doubanio.com/view/photo/s_ratio_poster/public/p2569450232.jpg\" width=\"75\" alt=\"\\xe9\\xbb\\x91\\xe6\\xb0\\xb4\" class=\"\"/>\\n                    </a>\\n            </td>\\n\\n            <td valign=\"top\">\\n                \\n\\n                <div class=\"pl2\">\\n\\n                    <a href=\"https://movie.douban.com/subject/30331959/\"  class=\"\">\\n                        \\xe9\\xbb\\x91\\xe6\\xb0\\xb4\\n                        / <span style=\"font-size:13px;\">\\xe8\\xbf\\xbd\\xe5\\x87\\xbb\\xe9\\xbb\\x91\\xe6\\xb0\\xb4\\xe7\\x9c\\x9f\\xe7\\x9b\\xb8(\\xe6\\xb8\\xaf) / \\xe9\\xbb\\x91\\xe6\\xb0\\xb4\\xe9\\xa3\\x8e\\xe6\\x9a\\xb4(\\xe5\\x8f\\xb0)</span>\\n                    </a>\\n\\n\\n\\n                    <p class=\"pl\">2019-11-22(\\xe7\\xbe\\x8e\\xe5\\x9b\\xbd\\xe7\\x82\\xb9\\xe6\\x98\\xa0) / 2019-12-06(\\xe7\\xbe\\x8e\\xe5\\x9b\\xbd) / \\xe9\\xa9\\xac\\xe5\\x85\\x8b\\xc2\\xb7\\xe9\\xb2\\x81\\xe5\\xbc\\x97\\xe6\\xb4\\x9b / \\xe5\\xae\\x89\\xe5\\xa6\\xae\\xc2\\xb7\\xe6\\xb5\\xb7\\xe7\\x91\\x9f\\xe8\\x96\\x87 / \\xe8\\x92\\x82\\xe5\\xa7\\x86\\xc2\\xb7\\xe7\\xbd\\x97\\xe5\\xae\\xbe\\xe6\\x96\\xaf / \\xe6\\xaf\\x94\\xe5\\xb0\\x94\\xc2\\xb7\\xe5\\x9d\\x8e\\xe6\\x99\\xae / \\xe7\\xbb\\xb4\\xe5\\x85\\x8b\\xe5\\xa4\\x9a\\xc2\\xb7\\xe5\\x8a\\xa0\\xe5\\x8d\\x9a / \\xe6\\xaf\\x94\\xe5\\xb0\\x94\\xc2\\xb7\\xe6\\x99\\xae\\xe5\\xb0\\x94\\xe6\\x9b\\xbc / \\xe6\\xa2\\x85\\xe5\\xb0\\x94\\xc2\\xb7\\xe6\\xb8\\xa9\\xe5\\xae\\x81\\xe6\\xb1\\x89\\xe5\\xa7\\x86 / \\xe5\\xa8\\x81\\xe5\\xbb\\x89\\xc2\\xb7\\xe6\\x9d\\xb0\\xe5\\x85\\x8b\\xe6\\xa3\\xae\\xc2\\xb7\\xe5\\x93\\x88\\xe7\\x8f\\x80 / \\xe8\\xb7\\xaf\\xe6\\x98\\x93\\xe8\\x8e\\x8e\\xc2\\xb7\\xe5\\x85\\x8b\\xe5\\x8a\\xb3\\xe7\\x91\\x9f / 
\\xe5\\x87\\xaf\\xe6\\x96\\x87\\xc2\\xb7\\xe5\\x85\\x8b\\xe5\\x8a\\xb3\\xe5\\x88\\xa9 / \\xe4\\xb8\\xb9\\xe5\\xb0\\xbc\\xe5\\xb0\\x94\\xc2\\xb7R\\xc2\\xb7\\xe5\\xb8\\x8c\\xe5\\xb0\\x94 / \\xe7\\x8e\\x8b\\xe6\\x98\\x8e / \\xe8\\xa5\\xbf\\xe5\\xb0\\xbc\\xc2\\xb7\\xe8\\xbf\\x88\\xe5\\xb0\\x94\\xe6\\x96\\xaf...</p>\\n\\n                    \\n\\n\\n                        \\n                        <div class=\"star clearfix\">\\n                                <span class=\"allstar45\"></span>\\n                                <span class=\"rating_nums\">8.5</span>\\n                                <span class=\"pl\">(39116\\xe4\\xba\\xba\\xe8\\xaf\\x84\\xe4\\xbb\\xb7)</span>\\n\\n                        </div>\\n\\n\\n                </div>\\n\\n            </td>\\n        </tr>\\n    </table>\\n    <div id=\"collect_form_30331959\"></div>\\n</div>\\n\\n\\n    </div>\\n    \\n\\n            </div>\\n            <div class=\"aside\">\\n                \\n    \\n  \\n  <div>\\n      <h2>\\xe5\\x88\\x86\\xe7\\xb1\\xbb\\xe6\\x8e\\x92\\xe8\\xa1\\x8c\\xe6\\xa6\\x9c \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7<img style=\" position: absolute;\" src=\"https://img3.doubanio.com/f/shire/e49eca1517424a941871a2667a8957fd6c72d632/pics/new_menu.gif\"></h2>\\n      <div class=\"types\">\\n          <span><a href=\"/typerank?type_name=\\xe5\\x89\\xa7\\xe6\\x83\\x85&type=11&interval_id=100:90&action=\">\\xe5\\x89\\xa7\\xe6\\x83\\x85</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe5\\x96\\x9c\\xe5\\x89\\xa7&type=24&interval_id=100:90&action=\">\\xe5\\x96\\x9c\\xe5\\x89\\xa7</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe5\\x8a\\xa8\\xe4\\xbd\\x9c&type=5&interval_id=100:90&action=\">\\xe5\\x8a\\xa8\\xe4\\xbd\\x9c</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe7\\x88\\xb1\\xe6\\x83\\x85&type=13&interval_id=100:90&action=\">\\xe7\\x88\\xb1\\xe6\\x83\\x85</a></span>\\n          <span><a 
href=\"/typerank?type_name=\\xe7\\xa7\\x91\\xe5\\xb9\\xbb&type=17&interval_id=100:90&action=\">\\xe7\\xa7\\x91\\xe5\\xb9\\xbb</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe5\\x8a\\xa8\\xe7\\x94\\xbb&type=25&interval_id=100:90&action=\">\\xe5\\x8a\\xa8\\xe7\\x94\\xbb</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe6\\x82\\xac\\xe7\\x96\\x91&type=10&interval_id=100:90&action=\">\\xe6\\x82\\xac\\xe7\\x96\\x91</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe6\\x83\\x8a\\xe6\\x82\\x9a&type=19&interval_id=100:90&action=\">\\xe6\\x83\\x8a\\xe6\\x82\\x9a</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe6\\x81\\x90\\xe6\\x80\\x96&type=20&interval_id=100:90&action=\">\\xe6\\x81\\x90\\xe6\\x80\\x96</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe7\\xba\\xaa\\xe5\\xbd\\x95\\xe7\\x89\\x87&type=1&interval_id=100:90&action=\">\\xe7\\xba\\xaa\\xe5\\xbd\\x95\\xe7\\x89\\x87</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe7\\x9f\\xad\\xe7\\x89\\x87&type=23&interval_id=100:90&action=\">\\xe7\\x9f\\xad\\xe7\\x89\\x87</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe6\\x83\\x85\\xe8\\x89\\xb2&type=6&interval_id=100:90&action=\">\\xe6\\x83\\x85\\xe8\\x89\\xb2</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe5\\x90\\x8c\\xe6\\x80\\xa7&type=26&interval_id=100:90&action=\">\\xe5\\x90\\x8c\\xe6\\x80\\xa7</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe9\\x9f\\xb3\\xe4\\xb9\\x90&type=14&interval_id=100:90&action=\">\\xe9\\x9f\\xb3\\xe4\\xb9\\x90</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe6\\xad\\x8c\\xe8\\x88\\x9e&type=7&interval_id=100:90&action=\">\\xe6\\xad\\x8c\\xe8\\x88\\x9e</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe5\\xae\\xb6\\xe5\\xba\\xad&type=28&interval_id=100:90&action=\">\\xe5\\xae\\xb6\\xe5\\xba\\xad</a></span>\\n          <span><a 
href=\"/typerank?type_name=\\xe5\\x84\\xbf\\xe7\\xab\\xa5&type=8&interval_id=100:90&action=\">\\xe5\\x84\\xbf\\xe7\\xab\\xa5</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe4\\xbc\\xa0\\xe8\\xae\\xb0&type=2&interval_id=100:90&action=\">\\xe4\\xbc\\xa0\\xe8\\xae\\xb0</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe5\\x8e\\x86\\xe5\\x8f\\xb2&type=4&interval_id=100:90&action=\">\\xe5\\x8e\\x86\\xe5\\x8f\\xb2</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe6\\x88\\x98\\xe4\\xba\\x89&type=22&interval_id=100:90&action=\">\\xe6\\x88\\x98\\xe4\\xba\\x89</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe7\\x8a\\xaf\\xe7\\xbd\\xaa&type=3&interval_id=100:90&action=\">\\xe7\\x8a\\xaf\\xe7\\xbd\\xaa</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe8\\xa5\\xbf\\xe9\\x83\\xa8&type=27&interval_id=100:90&action=\">\\xe8\\xa5\\xbf\\xe9\\x83\\xa8</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe5\\xa5\\x87\\xe5\\xb9\\xbb&type=16&interval_id=100:90&action=\">\\xe5\\xa5\\x87\\xe5\\xb9\\xbb</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe5\\x86\\x92\\xe9\\x99\\xa9&type=15&interval_id=100:90&action=\">\\xe5\\x86\\x92\\xe9\\x99\\xa9</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe7\\x81\\xbe\\xe9\\x9a\\xbe&type=12&interval_id=100:90&action=\">\\xe7\\x81\\xbe\\xe9\\x9a\\xbe</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe6\\xad\\xa6\\xe4\\xbe\\xa0&type=29&interval_id=100:90&action=\">\\xe6\\xad\\xa6\\xe4\\xbe\\xa0</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe5\\x8f\\xa4\\xe8\\xa3\\x85&type=30&interval_id=100:90&action=\">\\xe5\\x8f\\xa4\\xe8\\xa3\\x85</a></span>\\n          <span><a href=\"/typerank?type_name=\\xe8\\xbf\\x90\\xe5\\x8a\\xa8&type=18&interval_id=100:90&action=\">\\xe8\\xbf\\x90\\xe5\\x8a\\xa8</a></span>\\n          <span><a 
href=\"/typerank?type_name=\\xe9\\xbb\\x91\\xe8\\x89\\xb2\\xe7\\x94\\xb5\\xe5\\xbd\\xb1&type=31&interval_id=100:90&action=\">\\xe9\\xbb\\x91\\xe8\\x89\\xb2\\xe7\\x94\\xb5\\xe5\\xbd\\xb1</a></span>\\n      </div>\\n  </div>\\n\\n    <!-- douban ad begin -->\\n    <div id=\"dale_movie_chart_top_right\"></div>\\n    <!-- douban ad end -->\\n\\n    \\n    <div class=\"movie_top\" id=\"ranking\">\\n    <div class=\"movie_top\" id=\"ranking\">\\n        \\n    \\n    \\n    <h2>\\xe4\\xb8\\x80\\xe5\\x91\\xa8\\xe5\\x8f\\xa3\\xe7\\xa2\\x91\\xe6\\xa6\\x9c\\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 <span class=\"box_chart_num color-gray\">3\\xe6\\x9c\\x8813\\xe6\\x97\\xa5 \\xe6\\x9b\\xb4\\xe6\\x96\\xb0</span></h2>\\n    <ul class=\"content\" id=\"listCont2\">\\n        <li class=\"clearfix\">\\n            <div class=\"no\">1</div>\\n            <div class=\"name\">\\n                <a onclick=\"moreurl(this, {from:\\'mv_week\\'})\" href=\"https://movie.douban.com/subject/30241298/\" class=\"\">\\n                    \\xe5\\x8d\\x97\\xe5\\xb1\\xb1\\xe7\\x9a\\x84\\xe9\\x83\\xa8\\xe9\\x95\\xbf\\xe4\\xbb\\xac\\n                </a>\\n            </div>\\n            <span class=\"\">\\n                    <div class=\"stay\">0</div>\\n            </span>\\n        </li>\\n        <li class=\"clearfix\">\\n            <div class=\"no\">2</div>\\n            <div class=\"name\">\\n                <a onclick=\"moreurl(this, {from:\\'mv_week\\'})\" href=\"https://movie.douban.com/subject/30479900/\" class=\"\">\\n                    \\xe6\\x88\\x91\\xe7\\x9c\\x9f\\xe6\\xad\\xa3\\xe7\\x9a\\x84\\xe5\\xa4\\xa9\\xe6\\x89\\x8d\\xe5\\xa5\\xb3\\xe5\\x8f\\x8b\\n                </a>\\n            </div>\\n            <span class=\"\">\\n                    <div class=\"up\">9</div>\\n            </span>\\n        </li>\\n        <li class=\"clearfix\">\\n            <div class=\"no\">3</div>\\n            <div class=\"name\">\\n                <a 
onclick=\"moreurl(this, {from:\\'mv_week\\'})\" href=\"https://movie.douban.com/subject/30447702/\" class=\"\">\\n                    \\xe5\\xbe\\xb7\\xe8\\x8f\\xb2\\xe5\\x9b\\xa0\\xe4\\xb8\\x8e\\xe5\\x8d\\xa1\\xe7\\xbd\\x97\\xe5\\xb0\\x94\\xef\\xbc\\x9a\\xe5\\x8f\\x8d\\xe5\\x8f\\x9b\\xe7\\xbc\\xaa\\xe6\\x96\\xaf\\n                </a>\\n            </div>\\n            <span class=\"\">\\n                    <div class=\"up\">8</div>\\n            </span>\\n        </li>\\n        <li class=\"clearfix\">\\n            <div class=\"no\">4</div>\\n            <div class=\"name\">\\n                <a onclick=\"moreurl(this, {from:\\'mv_week\\'})\" href=\"https://movie.douban.com/subject/33415922/\" class=\"\">\\n                    \\xe5\\x89\\xa9\\xe5\\xa5\\xb3\\n                </a>\\n            </div>\\n            <span class=\"\">\\n                    <div class=\"down\">2</div>\\n            </span>\\n        </li>\\n        <li class=\"clearfix\">\\n            <div class=\"no\">5</div>\\n            <div class=\"name\">\\n                <a onclick=\"moreurl(this, {from:\\'mv_week\\'})\" href=\"https://movie.douban.com/subject/34951277/\" class=\"\">\\n                    \\xe4\\xb8\\x8e\\xe7\\x88\\xb1\\xe5\\x90\\x8c\\xe5\\xb1\\x85\\xe4\\xb9\\x8b\\xe6\\xb0\\xb8\\xe6\\x81\\x92\\xe7\\x9a\\x84\\xe7\\x88\\xb1\\n                </a>\\n            </div>\\n            <span class=\"\">\\n                    <div class=\"up\">6</div>\\n            </span>\\n        </li>\\n        <li class=\"clearfix\">\\n            <div class=\"no\">6</div>\\n            <div class=\"name\">\\n                <a onclick=\"moreurl(this, {from:\\'mv_week\\'})\" href=\"https://movie.douban.com/subject/27040109/\" class=\"\">\\n                    \\xe7\\x8b\\x82\\xe8\\xba\\x81\\xe8\\x8a\\x82\\xe6\\x8b\\x8d\\n                </a>\\n            </div>\\n            <span class=\"\">\\n                    <div class=\"down\">3</div>\\n            </span>\\n        </li>\\n        
<li class=\"clearfix\">\\n            <div class=\"no\">7</div>\\n            <div class=\"name\">\\n                <a onclick=\"moreurl(this, {from:\\'mv_week\\'})\" href=\"https://movie.douban.com/subject/27046645/\" class=\"\">\\n                    \\xe9\\x9b\\xb7\\xe7\\xb1\\xb3\\xe5\\xa5\\x87\\xe9\\x81\\x87\\xe8\\xae\\xb0\\n                </a>\\n            </div>\\n            <span class=\"\">\\n                    <div class=\"down\">2</div>\\n            </span>\\n        </li>\\n        <li class=\"clearfix\">\\n            <div class=\"no\">8</div>\\n            <div class=\"name\">\\n                <a onclick=\"moreurl(this, {from:\\'mv_week\\'})\" href=\"https://movie.douban.com/subject/27107766/\" class=\"\">\\n                    \\xe7\\xbb\\xb4\\xe5\\xa1\\x94\\xe5\\x88\\xa9\\xe5\\xa8\\x9c\\xc2\\xb7\\xe7\\x93\\xa6\\xe9\\x9b\\xb7\\xe6\\x8b\\x89\\n                </a>\\n            </div>\\n            <span class=\"\">\\n                    <div class=\"down\">1</div>\\n            </span>\\n        </li>\\n        <li class=\"clearfix\">\\n            <div class=\"no\">9</div>\\n            <div class=\"name\">\\n                <a onclick=\"moreurl(this, {from:\\'mv_week\\'})\" href=\"https://movie.douban.com/subject/30427480/\" class=\"\">\\n                    \\xe7\\xb3\\xbb\\xe7\\xbb\\x9f\\xe7\\xa0\\xb4\\xe5\\x9d\\x8f\\xe8\\x80\\x85\\n                </a>\\n            </div>\\n            <span class=\"\">\\n                    <div class=\"down\">1</div>\\n            </span>\\n        </li>\\n        <li class=\"clearfix\">\\n            <div class=\"no\">10</div>\\n            <div class=\"name\">\\n                <a onclick=\"moreurl(this, {from:\\'mv_week\\'})\" href=\"https://movie.douban.com/subject/30152072/\" class=\"\">\\n                    \\xe5\\xae\\x89\\xe5\\xb0\\xbc\\xe4\\xba\\x9a\\xe6\\x8b\\x89\\xe5\\x8f\\xb7\\n                </a>\\n            </div>\\n            <span class=\"\">\\n                    <div 
class=\"stay\">0</div>\\n            </span>\\n        </li>\\n    </ul>\\n\\n    </div>\\n\\n    <div class=\"movie_top\" id=\"ranking\">\\n        \\n    \\n    <h2>\\xe5\\x8c\\x97\\xe7\\xbe\\x8e\\xe7\\xa5\\xa8\\xe6\\x88\\xbf\\xe6\\xa6\\x9c\\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 \\xc2\\xb7 <span class=\"box_chart_num color-gray\">3\\xe6\\x9c\\x8813\\xe6\\x97\\xa5 \\xe6\\x9b\\xb4\\xe6\\x96\\xb0 / \\xe7\\xbe\\x8e\\xe5\\x85\\x83</span></h2>\\n    <ul class=\"content\" id=\"listCont1\">\\n            \\n                <li class=\"clearfix\">\\n                    <div class=\"no\">1</div>\\n                    <div class=\"box_chart\">\\n                        <a onclick=\"moreurl(this, {from:\\'mv_us_week\\'})\" href=\"https://movie.douban.com/subject/30401849/\" class=\"\">\\n                            1/2\\xe7\\x9a\\x84\\xe9\\xad\\x94\\xe6\\xb3\\x95\\n                        </a>\\n                    </div>\\n                    <span class=\"box_chart_num color-gray\">1053\\xe4\\xb8\\x87</span>\\n                </li>\\n            \\n                <li class=\"clearfix\">\\n                    <div class=\"no\">2</div>\\n                    <div class=\"box_chart\">\\n                        <a onclick=\"moreurl(this, {from:\\'mv_us_week\\'})\" href=\"https://movie.douban.com/subject/34802738/\" class=\"\">\\n                            \\xe6\\x88\\x91\\xe4\\xbb\\x8d\\xe7\\x84\\xb6\\xe7\\x9b\\xb8\\xe4\\xbf\\xa1\\n                        </a>\\n                                <img src=\"https://img3.doubanio.com/f/shire/267048ed5190c4c6b513c2e559cae7ae8b8f0af5/pics/box_new.png\" />\\n                    </div>\\n                    <span class=\"box_chart_num color-gray\">950\\xe4\\xb8\\x87</span>\\n                </li>\\n            \\n                <li class=\"clearfix\">\\n                    <div class=\"no\">3</div>\\n                    <div class=\"box_chart\">\\n                        <a onclick=\"moreurl(this, 
{from:\\'mv_us_week\\'})\" href=\"https://movie.douban.com/subject/4830483/\" class=\"\">\\n                            \\xe5\\x96\\x8b\\xe8\\xa1\\x80\\xe6\\x88\\x98\\xe5\\xa3\\xab\\n                        </a>\\n                                <img src=\"https://img3.doubanio.com/f/shire/267048ed5190c4c6b513c2e559cae7ae8b8f0af5/pics/box_new.png\" />\\n                    </div>\\n                    <span class=\"box_chart_num color-gray\">930\\xe4\\xb8\\x87</span>\\n                </li>\\n            \\n                <li class=\"clearfix\">\\n                    <div class=\"no\">4</div>\\n                    <div class=\"box_chart\">\\n                        <a onclick=\"moreurl(this, {from:\\'mv_us_week\\'})\" href=\"https://movie.douban.com/subject/2364086/\" class=\"\">\\n                            \\xe9\\x9a\\x90\\xe5\\xbd\\xa2\\xe4\\xba\\xba\\n                        </a>\\n                    </div>\\n                    <span class=\"box_chart_num color-gray\">600\\xe4\\xb8\\x87</span>\\n                </li>\\n            \\n                <li class=\"clearfix\">\\n                    <div class=\"no\">5</div>\\n                    <div class=\"box_chart\">\\n                        <a onclick=\"moreurl(this, {from:\\'mv_us_week\\'})\" href=\"https://movie.douban.com/subject/30182726/\" class=\"\">\\n                            \\xe7\\x8b\\xa9\\xe7\\x8c\\x8e\\n                        </a>\\n                                <img src=\"https://img3.doubanio.com/f/shire/267048ed5190c4c6b513c2e559cae7ae8b8f0af5/pics/box_new.png\" />\\n                    </div>\\n                    <span class=\"box_chart_num color-gray\">532\\xe4\\xb8\\x87</span>\\n                </li>\\n            \\n                <li class=\"clearfix\">\\n                    <div class=\"no\">6</div>\\n                    <div class=\"box_chart\">\\n                        <a onclick=\"moreurl(this, {from:\\'mv_us_week\\'})\" href=\"https://movie.douban.com/subject/25905044/\" 
class=\"\">\\n                            \\xe5\\x88\\xba\\xe7\\x8c\\xac\\xe7\\xb4\\xa2\\xe5\\xb0\\xbc\\xe5\\x85\\x8b\\n                        </a>\\n                    </div>\\n                    <span class=\"box_chart_num color-gray\">258\\xe4\\xb8\\x87</span>\\n                </li>\\n            \\n                <li class=\"clearfix\">\\n                    <div class=\"no\">7</div>\\n                    <div class=\"box_chart\">\\n                        <a onclick=\"moreurl(this, {from:\\'mv_us_week\\'})\" href=\"https://movie.douban.com/subject/30345227/\" class=\"\">\\n                            \\xe5\\x9b\\x9e\\xe5\\xbd\\x92\\xe4\\xb9\\x8b\\xe8\\xb7\\xaf\\n                        </a>\\n                    </div>\\n                    <span class=\"box_chart_num color-gray\">242\\xe4\\xb8\\x87</span>\\n                </li>\\n            \\n                <li class=\"clearfix\">\\n                    <div class=\"no\">8</div>\\n                    <div class=\"box_chart\">\\n                        <a onclick=\"moreurl(this, {from:\\'mv_us_week\\'})\" href=\"https://movie.douban.com/subject/27199324/\" class=\"\">\\n                            \\xe9\\x87\\x8e\\xe6\\x80\\xa7\\xe7\\x9a\\x84\\xe5\\x91\\xbc\\xe5\\x94\\xa4\\n                        </a>\\n                    </div>\\n                    <span class=\"box_chart_num color-gray\">224\\xe4\\xb8\\x87</span>\\n                </li>\\n            \\n                <li class=\"clearfix\">\\n                    <div class=\"no\">9</div>\\n                    <div class=\"box_chart\">\\n                        <a onclick=\"moreurl(this, {from:\\'mv_us_week\\'})\" href=\"https://movie.douban.com/subject/30361878/\" class=\"\">\\n                            \\xe7\\x88\\xb1\\xe7\\x8e\\x9b\\n                        </a>\\n                    </div>\\n                    <span class=\"box_chart_num color-gray\">137\\xe4\\xb8\\x87</span>\\n                </li>\\n            \\n                <li 
class=\"clearfix\">\\n                    <div class=\"no\">10</div>\\n                    <div class=\"box_chart\">\\n                        <a onclick=\"moreurl(this, {from:\\'mv_us_week\\'})\" href=\"https://movie.douban.com/subject/4014397/\" class=\"\">\\n                            \\xe7\\xbb\\x9d\\xe5\\x9c\\xb0\\xe6\\x88\\x98\\xe8\\xad\\xa6\\xef\\xbc\\x9a\\xe7\\x96\\xbe\\xe9\\x80\\x9f\\xe8\\xbf\\xbd\\xe5\\x87\\xbb\\n                        </a>\\n                    </div>\\n                    <span class=\"box_chart_num color-gray\">110\\xe4\\xb8\\x87</span>\\n                </li>\\n    </ul>\\n\\n    </div>\\n\\n    <!-- douban ad begin -->\\n    \\n\\n\\n\\n\\n\\n<div class=\"mobile-app-entrance block5 app-movie\">\\n    <a class=\"entrance-link\" href=\"https://www.douban.com/doubanapp/frodo\">\\n        <div class=\"entrance-qrcode\">\\n            <img src=\"https://img3.doubanio.com/f/movie/a02f6ed325fc52e220f299d51e730c422e2bcd16/pics/movie/douban_app_ad/qrcode.png\" alt=\"\\xe6\\x89\\xab\\xe7\\xa0\\x81\\xe4\\xb8\\x8b\\xe8\\xbd\\xbd\\xe8\\xb1\\x86\\xe7\\x93\\xa3 App\" width=\"80\" height=\"80\" />\\n        </div>\\n        <div class=\"entrance-info\">\\n            <span class=\"app-icon icon-movie\"></span>\\n            <span class=\"main-title\">\\xe8\\xb1\\x86\\xe7\\x93\\xa3</span>\\n            <span class=\"sub-title\">\\xe4\\xbd\\xa0\\xe7\\x9a\\x84\\xe7\\xa7\\xbb\\xe5\\x8a\\xa8\\xe8\\xa7\\x82\\xe5\\xbd\\xb1\\xe6\\x8c\\x87\\xe5\\x8d\\x97</span>\\n        </div>\\n    </a>\\n</div>\\n\\n    <!-- douban ad end -->\\n\\n        <div class=\"indent\">\\n            \\n    <div id=\"douban-top250\">\\n        <div class=\"douban-top250-hd\">\\n            <h2>\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe7\\x94\\xb5\\xe5\\xbd\\xb1TOP250\\n                <span>\\n                    <a href=\"https://movie.douban.com/top250\">\\xe5\\x85\\xa8\\xe9\\x83\\xa8&nbsp;</a>\\n                </span>\\n            </h2>\\n        </div>\\n        <div 
class=\"douban-top250-bd\">\\n            \\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1304447/?from=top250\">\\n                    <img src=\"https://img3.doubanio.com/view/photo/s_ratio_poster/public/p641688453.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1304447/?from=top250\" class=\"\">\\n                    \\xe8\\xae\\xb0\\xe5\\xbf\\x86\\xe7\\xa2\\x8e\\xe7\\x89\\x87\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1793929/?from=top250\">\\n                    <img src=\"https://img1.doubanio.com/view/photo/s_ratio_poster/public/p2166160837.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1793929/?from=top250\" class=\"\">\\n                    \\xe8\\xbe\\xbe\\xe6\\x8b\\x89\\xe6\\x96\\xaf\\xe4\\xb9\\xb0\\xe5\\xae\\xb6\\xe4\\xbf\\xb1\\xe4\\xb9\\x90\\xe9\\x83\\xa8\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1299131/?from=top250\">\\n                    <img src=\"https://img1.doubanio.com/view/photo/s_ratio_poster/public/p2194138787.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" 
href=\"https://movie.douban.com/subject/1299131/?from=top250\" class=\"\">\\n                    \\xe6\\x95\\x99\\xe7\\x88\\xb62\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n            <div class=\"clearfix rr\" style=\"width:100%\"></div>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1291568/?from=top250\">\\n                    <img src=\"https://img9.doubanio.com/view/photo/s_ratio_poster/public/p1925331564.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1291568/?from=top250\" class=\"\">\\n                    \\xe4\\xb8\\x9c\\xe4\\xba\\xac\\xe7\\x89\\xa9\\xe8\\xaf\\xad\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1787291/?from=top250\">\\n                    <img src=\"https://img9.doubanio.com/view/photo/s_ratio_poster/public/p884763596.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1787291/?from=top250\" class=\"\">\\n                    \\xe8\\xa2\\xab\\xe5\\xab\\x8c\\xe5\\xbc\\x83\\xe7\\x9a\\x84\\xe6\\x9d\\xbe\\xe5\\xad\\x90\\xe7\\x9a\\x84\\xe4\\xb8\\x80\\xe7\\x94\\x9f\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1302425/?from=top250\">\\n                 
   <img src=\"https://img1.doubanio.com/view/photo/s_ratio_poster/public/p2579932167.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1302425/?from=top250\" class=\"\">\\n                    \\xe5\\x96\\x9c\\xe5\\x89\\xa7\\xe4\\xb9\\x8b\\xe7\\x8e\\x8b\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n            <div class=\"clearfix rr\" style=\"width:100%\"></div>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1307811/?from=top250\">\\n                    <img src=\"https://img3.doubanio.com/view/photo/s_ratio_poster/public/p456676352.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1307811/?from=top250\" class=\"\">\\n                    \\xe9\\xad\\x94\\xe5\\xa5\\xb3\\xe5\\xae\\x85\\xe6\\x80\\xa5\\xe4\\xbe\\xbf\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/3592854/?from=top250\">\\n                    <img src=\"https://img3.doubanio.com/view/photo/s_ratio_poster/public/p2236181653.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/3592854/?from=top250\" class=\"\">\\n                    
\\xe7\\x96\\xaf\\xe7\\x8b\\x82\\xe7\\x9a\\x84\\xe9\\xba\\xa6\\xe5\\x85\\x8b\\xe6\\x96\\xaf4\\xef\\xbc\\x9a\\xe7\\x8b\\x82\\xe6\\x9a\\xb4\\xe4\\xb9\\x8b\\xe8\\xb7\\xaf\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1292434/?from=top250\">\\n                    <img src=\"https://img3.doubanio.com/view/photo/s_ratio_poster/public/p2567845803.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1292434/?from=top250\" class=\"\">\\n                    \\xe4\\xb8\\x80\\xe4\\xb8\\x80\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n            <div class=\"clearfix rr\" style=\"width:100%\"></div>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1291858/?from=top250\">\\n                    <img src=\"https://img1.doubanio.com/view/photo/s_ratio_poster/public/p2553104888.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/1291858/?from=top250\" class=\"\">\\n                    \\xe9\\xac\\xbc\\xe5\\xad\\x90\\xe6\\x9d\\xa5\\xe4\\xba\\x86\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/26430107/?from=top250\">\\n                    <img 
src=\"https://img1.doubanio.com/view/photo/s_ratio_poster/public/p2457609817.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/26430107/?from=top250\" class=\"\">\\n                    \\xe4\\xba\\x8c\\xe5\\x8d\\x81\\xe4\\xba\\x8c\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n        <dl class=\"\">\\n            <dt>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/6534248/?from=top250\">\\n                    <img src=\"https://img9.doubanio.com/view/photo/s_ratio_poster/public/p1735642656.jpg\" class=\"m_sub_img\"/>\\n                </a>\\n            </dt>\\n            <dd>\\n                <a onclick=\"moreurl(this, {from:\\'mv_tops\\'})\" href=\"https://movie.douban.com/subject/6534248/?from=top250\" class=\"\">\\n                    \\xe6\\x97\\xa0\\xe6\\x95\\x8c\\xe7\\xa0\\xb4\\xe5\\x9d\\x8f\\xe7\\x8e\\x8b\\n                </a>\\n                <span class=\"gact\"></span><br/>\\n            </dd>\\n        </dl>\\n            <div class=\"clearfix rr\" style=\"width:100%\"></div>\\n\\n        </div>\\n    </div>\\n    \\n\\n        </div>\\n    </div>\\n\\n            </div>\\n            <div class=\"extra\">\\n                \\n    <!-- douban ad begin -->\\n    <div id=\"dale_movie_chart_bottom_banner\"></div>\\n    <!-- douban ad end -->\\n\\n            </div>\\n        </div>\\n    </div>\\n\\n        \\n    <div id=\"footer\">\\n            <div class=\"footer-extra\"></div>\\n        \\n<span id=\"icp\" class=\"fleft gray-link\">\\n    &copy; 2005\\xef\\xbc\\x8d2020 douban.com, all rights reserved \\xe5\\x8c\\x97\\xe4\\xba\\xac\\xe8\\xb1\\x86\\xe7\\xbd\\x91\\xe7\\xa7\\x91\\xe6\\x8a\\x80\\xe6\\x9c\\x89\\xe9\\x99\\x90\\xe5\\x85\\xac\\xe5\\x8f\\xb8\\n</span>\\n\\n<a 
href=\"https://www.douban.com/hnypt/variformcyst.py\" style=\"display: none;\"></a>\\n\\n<span class=\"fright\">\\n    <a href=\"https://www.douban.com/about\">\\xe5\\x85\\xb3\\xe4\\xba\\x8e\\xe8\\xb1\\x86\\xe7\\x93\\xa3</a>\\n    \\xc2\\xb7 <a href=\"https://www.douban.com/jobs\">\\xe5\\x9c\\xa8\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe5\\xb7\\xa5\\xe4\\xbd\\x9c</a>\\n    \\xc2\\xb7 <a href=\"https://www.douban.com/about?topic=contactus\">\\xe8\\x81\\x94\\xe7\\xb3\\xbb\\xe6\\x88\\x91\\xe4\\xbb\\xac</a>\\n    \\xc2\\xb7 <a href=\"https://www.douban.com/about/legal\">\\xe6\\xb3\\x95\\xe5\\xbe\\x8b\\xe5\\xa3\\xb0\\xe6\\x98\\x8e</a>\\n    \\n    \\xc2\\xb7 <a href=\"https://help.douban.com/?app=movie\" target=\"_blank\">\\xe5\\xb8\\xae\\xe5\\x8a\\xa9\\xe4\\xb8\\xad\\xe5\\xbf\\x83</a>\\n    \\xc2\\xb7 <a href=\"https://www.douban.com/doubanapp/\">\\xe7\\xa7\\xbb\\xe5\\x8a\\xa8\\xe5\\xba\\x94\\xe7\\x94\\xa8</a>\\n    \\xc2\\xb7 <a href=\"https://www.douban.com/partner/\">\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe5\\xb9\\xbf\\xe5\\x91\\x8a</a>\\n</span>\\n\\n    </div>\\n\\n    </div>\\n    <!-- COLLECTED JS -->\\n        \\n        \\n    <link rel=\"stylesheet\" type=\"text/css\" href=\"https://img3.doubanio.com/f/shire/8377b9498330a2e6f056d863987cc7a37eb4d486/css/ui/dialog.css\" />\\n    <link rel=\"stylesheet\" type=\"text/css\" href=\"https://img3.doubanio.com/f/movie/4aca95d66d37ec0712b3d19973b5d8feb75f2f05/css/movie/mod/reg_login_pop.css\" />\\n    <script type=\"text/javascript\" src=\"https://img3.doubanio.com/f/shire/77323ae72a612bba8b65f845491513ff3329b1bb/js/do.js\" data-cfg-autoload=\"false\"></script>\\n    <script type=\"text/javascript\" src=\"https://img3.doubanio.com/f/shire/383a6e43f2108dc69e3ff2681bc4dc6c72a5ffb0/js/ui/dialog.js\"></script>\\n    <script type=\"text/javascript\">\\n        var HTTPS_DB=\\'https://www.douban.com\\';\\nvar account_pop={open:function(o,e){e?referrer=\"?referrer=\"+encodeURIComponent(e):referrer=\"?referrer=\"+window.location.href;var 
n=\"\",i=\"\",t=448;n=\"\\xe7\\x94\\xa8\\xe6\\x88\\xb7\\xe7\\x99\\xbb\\xe5\\xbd\\x95\",i=\"https://accounts.douban.com/passport/login_popup?source=movie\";var r=document.location.protocol+\"//\"+document.location.hostname,a=dui.Dialog({width:340,title:n,height:t,cls:\"account_pop\",isHideTitle:!0,modal:!0,content:\"<iframe scrolling=\\'no\\' frameborder=\\'0\\' width=\\'340\\' height=\\'\"+t+\"\\' src=\\'\"+i+\"\\' name=\\'\"+r+\"\\'></iframe>\"},!0),c=a.node;if(c.undelegate(),c.delegate(\".dui-dialog-close\",\"click\",function(){var o=$(\"body\");o.find(\"#login_msk\").hide(),o.find(\".account_pop\").remove()}),$(window).width()<478){var d=\"\";\"reg\"===o?d=HTTPS_DB+\"/accounts/register\"+referrer:\"login\"===o&&(d=HTTPS_DB+\"/accounts/login\"+referrer),window.location.href=d}else a.open();$(window).bind(\"message\",function(o){\"https://accounts.douban.com\"===o.originalEvent.origin&&(c.find(\"iframe\").css(\"height\",o.originalEvent.data),c.height(o.originalEvent.data),a.update())})}};Douban&&Douban.init_show_login&&(Douban.init_show_login=function(o){var e=$(o);e.click(function(){var o=e.data(\"ref\")||\"\";return account_pop.open(\"login\",o),!1})}),Do(function(){$(\"body\").delegate(\".pop_register\",\"click\",function(o){o.preventDefault();var e=$(this).data(\"ref\")||\"\";return account_pop.open(\"reg\",e),!1}),$(\"body\").delegate(\".pop_login\",\"click\",function(o){o.preventDefault();var e=$(this).data(\"ref\")||\"\";return account_pop.open(\"login\",e),!1})});\\n    </script>\\n\\n    \\n    <!-- douban ad begin -->\\n    \\n\\n\\n\\n\\n    \\n<script type=\"text/javascript\">\\n    (function (global) {\\n        var newNode = global.document.createElement(\\'script\\'),\\n            existingNode = global.document.getElementsByTagName(\\'script\\')[0],\\n            adSource = \\'//erebor.douban.com/\\',\\n            userId = \\'\\',\\n            browserId = \\'49dkYAMfWAw\\',\\n            criteria = \\'3:/chart\\',\\n            preview = 
\\'\\',\\n            debug = false,\\n            adSlots = [\\'dale_movie_chart_top_right\\', \\'dale_movie_chart_bottom_banner\\'];\\n\\n        global.DoubanAdRequest = {src: adSource, uid: userId, bid: browserId, crtr: criteria, prv: preview, debug: debug};\\n        global.DoubanAdSlots = (global.DoubanAdSlots || []).concat(adSlots);\\n\\n        newNode.setAttribute(\\'type\\', \\'text/javascript\\');\\n        newNode.setAttribute(\\'src\\', \\'//img1.doubanio.com/eDRjYjNvdi9mL2FkanMvZTQ2YTNkMjgwYjBiMzc2OWE4YTI3MWFhMzI0NTQwMTBlMWY3OTYzMy9hZC5yZWxlYXNlLmpz\\');\\n        newNode.setAttribute(\\'async\\', true);\\n        existingNode.parentNode.insertBefore(newNode, existingNode);\\n    })(this);\\n</script>\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n    <!-- douban ad end -->\\n\\n    \\n  \\n\\n\\n\\n\\n\\n\\n\\n\\n\\n<script type=\"text/javascript\">\\nvar _paq = _paq || [];\\n_paq.push([\\'trackPageView\\']);\\n_paq.push([\\'enableLinkTracking\\']);\\n(function() {\\n    var p=((\\'https:\\' == document.location.protocol) ? \\'https\\' : \\'http\\'), u=p+\\'://fundin.douban.com/\\';\\n    _paq.push([\\'setTrackerUrl\\', u+\\'piwik\\']);\\n    _paq.push([\\'setSiteId\\', \\'100001\\']);\\n    var d=document, g=d.createElement(\\'script\\'), s=d.getElementsByTagName(\\'script\\')[0];\\n    g.type=\\'text/javascript\\';\\n    g.defer=true;\\n    g.async=true;\\n    g.src=p+\\'://img3.doubanio.com/dae/fundin/piwik.js\\';\\n    s.parentNode.insertBefore(g,s);\\n})();\\n</script>\\n\\n<script type=\"text/javascript\">\\nvar setMethodWithNs = function(namespace) {\\n  var ns = namespace ? 
namespace + \\'.\\' : \\'\\'\\n    , fn = function(string) {\\n        if(!ns) {return string}\\n        return ns + string\\n      }\\n  return fn\\n}\\n\\nvar gaWithNamespace = function(fn, namespace) {\\n  var method = setMethodWithNs(namespace)\\n  fn.call(this, method)\\n}\\n\\nvar _gaq = _gaq || []\\n  , accounts = [\\n      { id: \\'UA-7019765-1\\', namespace: \\'douban\\' }\\n    , { id: \\'UA-7019765-19\\', namespace: \\'\\' }\\n    ]\\n  , gaInit = function(account) {\\n      gaWithNamespace(function(method) {\\n        gaInitFn.call(this, method, account)\\n      }, account.namespace)\\n    }\\n  , gaInitFn = function(method, account) {\\n      _gaq.push([method(\\'_setAccount\\'), account.id]);\\n      _gaq.push([method(\\'_setSampleRate\\'), \\'5\\']);\\n\\n      \\n  _gaq.push([method(\\'_addOrganic\\'), \\'google\\', \\'q\\'])\\n  _gaq.push([method(\\'_addOrganic\\'), \\'baidu\\', \\'wd\\'])\\n  _gaq.push([method(\\'_addOrganic\\'), \\'soso\\', \\'w\\'])\\n  _gaq.push([method(\\'_addOrganic\\'), \\'youdao\\', \\'q\\'])\\n  _gaq.push([method(\\'_addOrganic\\'), \\'so.360.cn\\', \\'q\\'])\\n  _gaq.push([method(\\'_addOrganic\\'), \\'sogou\\', \\'query\\'])\\n  if (account.namespace) {\\n    _gaq.push([method(\\'_addIgnoredOrganic\\'), \\'\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\'])\\n    _gaq.push([method(\\'_addIgnoredOrganic\\'), \\'douban\\'])\\n    _gaq.push([method(\\'_addIgnoredOrganic\\'), \\'\\xe8\\xb1\\x86\\xe7\\x93\\xa3\\xe7\\xbd\\x91\\'])\\n    _gaq.push([method(\\'_addIgnoredOrganic\\'), \\'www.douban.com\\'])\\n  }\\n\\n      if (account.namespace === \\'douban\\') {\\n        _gaq.push([method(\\'_setDomainName\\'), \\'.douban.com\\'])\\n      }\\n\\n        _gaq.push([method(\\'_setCustomVar\\'), 1, \\'responsive_view_mode\\', \\'desktop\\', 3])\\n\\n        _gaq.push([method(\\'_setCustomVar\\'), 2, \\'login_status\\', \\'0\\', 2]);\\n\\n      _gaq.push([method(\\'_trackPageview\\')])\\n    }\\n\\nfor(var i = 0, l = accounts.length; i < l; i++) 
{\\n  var account = accounts[i]\\n  gaInit(account)\\n}\\n\\n\\n;(function() {\\n    var ga = document.createElement(\\'script\\');\\n    ga.src = (\\'https:\\' == document.location.protocol ? \\'https://ssl\\' : \\'http://www\\') + \\'.google-analytics.com/ga.js\\';\\n    ga.setAttribute(\\'async\\', \\'true\\');\\n    document.documentElement.firstChild.appendChild(ga);\\n})()\\n</script>\\n\\n\\n\\n\\n\\n\\n\\n\\n      \\n    \\n\\n    <!-- dae-web-movie--default-6d5d4d94c4-86qx2-->\\n\\n  <script>_SPLITTEST=\\'\\'</script>\\n</body>\\n\\n</html>\\n\\n\\n'\n"
     ]
    }
   ],
   "source": [
    "print (r.status_code, r.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[Empty DataFrame\n",
       " Columns: []\n",
       " Index: [], Empty DataFrame\n",
       " Columns: [1917  / 1917：逆战救兵(港) / 一九一七  2019-12-25(美国) / 2020-01-10(英国) / 2020(中国大陆) / 乔治·麦凯 / 迪恩·查尔斯·查普曼 / 科林·费尔斯 / 本尼迪克特·康伯巴奇 / 马克·斯特朗 / 理查德·麦登 / 安德鲁·斯科特 / 丹尼尔·梅斯 / 阿德里安·斯卡伯勒 / 约翰·霍林沃思 / 克里斯·瓦利...  8.5  (152102人评价)]\n",
       " Index: [], Empty DataFrame\n",
       " Columns: [小妇人  / 她们(台)  2019-12-25(美国) / 2020(中国大陆) / 西尔莎·罗南 / 艾玛·沃森 / 弗洛伦斯·皮尤 / 伊莱扎·斯坎伦 / 劳拉·邓恩 / 蒂莫西·柴勒梅德 / 梅丽尔·斯特里普 / 鲍勃·奥登科克 / 詹姆斯·诺顿 / 路易·加瑞尔 / 克里斯·库珀 / 崔西·莱茨 / 艾比·奎因...  8.1  (118362人评价)]\n",
       " Index: [], Empty DataFrame\n",
       " Columns: [寄生虫  / 寄生上流(台) / 上流寄生族(港)  2019-05-21(戛纳电影节) / 2019-05-30(韩国) / 宋康昊 / 李善均 / 赵汝贞 / 崔宇植 / 朴素丹 / 李静恩 / 张慧珍 / 郑知晓 / 朴明勋 / 朴叙俊 / 朴根祿 / 郑贤俊 / 朴孝新 / 安德烈亚斯·弗龙克 / 郑益汉 / 李东勇 / 李柱亨 / 林艺恩 / 韩国 / 奉俊昊...  8.7  (894668人评价)]\n",
       " Index: [], Empty DataFrame\n",
       " Columns: [南山的部长们  / The Man Standing Next  2020-01-22(韩国) / 李秉宪 / 李星民 / 郭度沅 / 李熙俊 / 金素真 / 徐贤宇 / 朴智一 / 李泰亨 / 金昇勋 / 金明善 / 朴成根 / 郑钟宇 / 金民尚 / 周锡泰 / 成民秀 / 赵惠珠 / 孙炳旭 / 朴炫宇 / 严志满 / 柳正浩 / 金弘波 / 李东国 / 韩国 / 禹民镐...  8.2  (49775人评价)]\n",
       " Index: [], Empty DataFrame\n",
       " Columns: [猛禽小队和哈莉·奎茵  / 哈莉·奎因：猛禽小队 / 猛禽小队  2020-02-07(美国) / 玛格特·罗比 / 玛丽·伊丽莎白·温斯特德 / 罗茜·佩雷兹 / 朱尼·斯莫利特 / 伊万·麦克格雷格 / 埃拉·杰伊·巴斯科 / 克里斯·梅西纳 / 黄阿丽 / 戴维·尤里 / 萨拉·蒙特斯 / 伊莎贝尔·帕克扎德 / 丹尼尔·伯哈特 / 帕洛马·拉比诺夫...  5.9  (30201人评价)]\n",
       " Index: [], Empty DataFrame\n",
       " Columns: [小丑  / 小丑起源电影：罗密欧 / Romeo  2019-08-31(威尼斯电影节) / 2019-10-04(美国) / 华金·菲尼克斯 / 罗伯特·德尼罗 / 马克·马龙 / 莎姬·贝兹 / 谢伊·惠格姆 / 弗兰西丝·康罗伊 / 布莱恩·考伦 / 布莱恩·泰里·亨利 / 布莱特·卡伦 / 道格拉斯·霍奇斯 / 格伦·弗莱施勒 / 比尔·坎普...  8.7  (645927人评价)]\n",
       " Index: [], Empty DataFrame\n",
       " Columns: [乔乔的异想世界  / 乔乔兔 / 少年乔乔的异想世界  2019-09-08(多伦多电影节) / 2019-11-08(美国) / 2020(中国大陆) / 罗曼·格里芬·戴维斯 / 托马辛·麦肯齐 / 斯嘉丽·约翰逊 / 塔伊加·维迪提 / 山姆·洛克威尔 / 蕾蓓尔·威尔森 / 阿尔菲·艾伦 / 斯戴芬·莫昌特 / 阿奇·耶茨 / 卢克·布兰登·菲尔德...  8.4  (128547人评价)]\n",
       " Index: [], Empty DataFrame\n",
       " Columns: [阳光普照  / A Sun  2019-09-06(多伦多电影节) / 2019-11-01(中国台湾) / 陈以文 / 柯淑勤 / 巫建和 / 刘冠廷 / 许光汉 / 尹馨 / 温贞菱 / 吴岱凌 / 林志儒 / 龙劭华 / 胡鸿达 / 施名帅 / 张立东 / 张少怀 / 黄信尧 / 张翰 / 范姜泰基 / 张耀升 / 中国台湾 / 钟孟宏 / 155分钟...  8.4  (112475人评价)]\n",
       " Index: [], Empty DataFrame\n",
       " Columns: [利刃出鞘  / 致命遗产 / 锋回路转(台)  2019-09-07(多伦多电影节) / 2019-11-27(美国) / 2019-11-29(中国大陆) / 丹尼尔·克雷格 / 安娜·德·阿玛斯 / 克里斯·埃文斯 / 杰米·李·柯蒂斯 / 迈克尔·珊农 / 唐·约翰逊 / 托妮·科莱特 / 勒凯斯·斯坦菲尔德 / 克里斯托弗·普卢默 / 凯瑟琳·兰福德...  8.2  (392146人评价)]\n",
       " Index: [], Empty DataFrame\n",
       " Columns: [黑水  / 追击黑水真相(港) / 黑水风暴(台)  2019-11-22(美国点映) / 2019-12-06(美国) / 马克·鲁弗洛 / 安妮·海瑟薇 / 蒂姆·罗宾斯 / 比尔·坎普 / 维克多·加博 / 比尔·普尔曼 / 梅尔·温宁汉姆 / 威廉·杰克森·哈珀 / 路易莎·克劳瑟 / 凯文·克劳利 / 丹尼尔·R·希尔 / 王明 / 西尼·迈尔斯...  8.5  (39116人评价)]\n",
       " Index: []]"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df = pd.read_html(r.content, encoding=\"utf8\", header=0, index_col=0)\n",
    "df"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 改试 requests + lxml\n",
    "该您了? 本周小作业\n",
    "\n",
    "1. 极易: prj00_例 liepin工作 找另外的工作 或 prj00_例 图片新闻_Bing 找另外的图片\n",
    "2. 易: prj00_例 liepin工作 找另外的工作，并改用不同的限定条件（例如不同城市）\n",
    "3. 中: prj00_例 liepin工作 找另外的工作 且 抽取（extract）出 薪水、城市等信息\n",
    "4. 中: prj00_例 图片新闻_Bing 找另外的图片 且 抽取出 图片、图说等信息\n",
    "5. 难: prj00_例 liepin工作 找另外的工作 且 抽取出 薪水、城市等信息\n",
    "6. 难: prj00_例 图片新闻_Bing 你如何按栏目(例如 今日热图, 明星, 美女) 抽取出 图片、图说等信息?\n",
    "7. 难: 豆瓣电影排行榜 你如何 ETL (抽取（extract）、转换（transform）、加载（load）至目的端)?\n",
    "\n",
    "每个人需提交一个 GitHub Jekyll 的本周小作业笔记的URL，建议是\n",
    "* 至少一个ipynb文档 或 \n",
    "* 一个markdown文档加一个ipynb文档(提交的入口点第一部分内容需要有另一个相关文档的链结及简要说明)\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "---\n",
    "结束\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.4"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
